diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..52373fe24473b1aa44333d318f578ae6bf04b49b 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/abliteration_config.json b/abliteration_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0907d75d3d714121b59c70913eb38179534e1182 --- /dev/null +++ b/abliteration_config.json @@ -0,0 +1,8 @@ +{ + "model_name": "zai-org/GLM-4.7", + "strength_min": 0.5, + "strength_max": 3.5, + "winsorize_percentile": 0.995, + "target_layers": "auto", + "timestamp": "2025-12-24T04:46:30.308483" +} \ No newline at end of file diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..2ab98ef068d62829d17c5ade1827b9f013fa2bbf --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,86 @@ +[gMASK] +{%- if tools -%} +<|system|> +# Tools + +You may call one or more functions to assist with the user query. + +You are provided with function signatures within XML tags: + +{% for tool in tools %} +{{ tool | tojson(ensure_ascii=False) }} +{% endfor %} + + +For each function call, output the function name and arguments within the following XML format: +{function-name}{arg-key-1}{arg-value-1}{arg-key-2}{arg-value-2}...{%- endif -%} +{%- macro visible_text(content) -%} + {%- if content is string -%} + {{- content }} + {%- elif content is iterable and content is not mapping -%} + {%- for item in content -%} + {%- if item is mapping and item.type == 'text' -%} + {{- item.text }} + {%- elif item is string -%} + {{- item }} + {%- endif -%} + {%- endfor -%} + {%- else -%} + {{- content }} + {%- endif -%} +{%- endmacro -%} +{%- set ns = namespace(last_user_index=-1) %} +{%- for m in messages %} + {%- if m.role == 'user' %} + {% set ns.last_user_index = loop.index0 -%} + {%- endif %} +{%- endfor %} +{% for m in messages %} +{%- if m.role == 'user' -%}<|user|>{{ visible_text(m.content) }} +{%- elif m.role == 'assistant' -%} +<|assistant|> +{%- set reasoning_content = '' %} +{%- set content = visible_text(m.content) %} +{%- if m.reasoning_content is string %} + {%- set reasoning_content = m.reasoning_content %} +{%- else %} + {%- if '' in content %} + {%- set reasoning_content = content.split('')[0].rstrip('\n').split('')[-1].lstrip('\n') %} + {%- set content = content.split('')[-1].lstrip('\n') %} + {%- endif %} +{%- endif %} +{%- if ((clear_thinking is defined and not clear_thinking) or loop.index0 > ns.last_user_index) and reasoning_content -%} +{{ '' + reasoning_content.strip() + ''}} +{%- else -%} +{{ '' }} +{%- endif -%} +{%- if content.strip() -%} +{{ content.strip() }} +{%- endif -%} +{% if m.tool_calls %} +{% for tc in m.tool_calls %} +{%- if tc.function %} + {%- set tc = tc.function %} +{%- endif %} +{{- '' + tc.name -}} +{% set _args = tc.arguments %}{% for k, v in _args.items() %}{{ k }}{{ v | tojson(ensure_ascii=False) if v is not string else v }}{% endfor %}{% endfor %} +{% endif %} +{%- elif m.role == 'tool' -%} +{%- if m.content is string -%} +{%- if loop.first or (messages[loop.index0 - 1].role != "tool") %} + {{- '<|observation|>' }} +{%- endif %} +{{- '' }} +{{- m.content }} +{{- '' }} +{%- else -%} +<|observation|>{% for tr in m.content %} +{{ tr.output if tr.output is defined else tr }}{% endfor -%} +{% endif -%} +{%- elif m.role == 'system' -%} +<|system|>{{ visible_text(m.content) }} +{%- endif -%} +{%- endfor -%} +{%- if add_generation_prompt -%} + <|assistant|>{{- '' if (enable_thinking is defined and not enable_thinking) else '' -}} +{%- endif -%} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cbf0ec52595057d738c563bdcfb976c2c73aa7de --- /dev/null +++ b/config.json @@ -0,0 +1,43 @@ +{ + "architectures": [ + "Glm4MoeForCausalLM" + ], + "attention_bias": true, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "eos_token_id": [ + 151329, + 151336, + 151338 + ], + "first_k_dense_replace": 3, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 5120, + "initializer_range": 0.02, + "intermediate_size": 12288, + "max_position_embeddings": 202752, + "model_type": "glm4_moe", + "moe_intermediate_size": 1536, + "n_group": 1, + "n_routed_experts": 160, + "n_shared_experts": 1, + "norm_topk_prob": true, + "num_attention_heads": 96, + "num_experts_per_tok": 8, + "num_hidden_layers": 92, + "num_key_value_heads": 8, + "num_nextn_predict_layers": 1, + "pad_token_id": 151329, + "partial_rotary_factor": 0.5, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 1000000, + "routed_scaling_factor": 2.5, + "tie_word_embeddings": false, + "topk_group": 1, + "transformers_version": "4.57.3", + "use_cache": true, + "use_qk_norm": true, + "vocab_size": 151552 +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a7958b7d81d1338ae40db2fd0d9d030effc9e41d --- /dev/null +++ b/generation_config.json @@ -0,0 +1,10 @@ +{ + "_from_model_config": true, + "eos_token_id": [ + 151329, + 151336, + 151338 + ], + "pad_token_id": 151329, + "transformers_version": "4.57.3" +} diff --git a/model-00001-of-00142.safetensors b/model-00001-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8bdf4f250b34ad3734fe7a26c70eac7cbfe34c5c --- /dev/null +++ b/model-00001-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3745695dc799241a6899501ddb6cbe3b3d0cf4ae114e78b57b7751e81134b6d1 +size 4986172552 diff --git a/model-00002-of-00142.safetensors b/model-00002-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c0b6a763403803ae5f9d2e5026f1c184e4938cbb --- /dev/null +++ b/model-00002-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:786c5f3db310f1687ec28b2a116c675c2e179163ab4212979d50ddf2fa626dc9 +size 4986018288 diff --git a/model-00003-of-00142.safetensors b/model-00003-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c3087f1190ddbfb9b3d3ebfb78ccae0d1f41fb0a --- /dev/null +++ b/model-00003-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:426a8ce8b7ca5567cabe64bb49dcff9929d1e027f50bbf31a17241a35fa298fd +size 4992949184 diff --git a/model-00004-of-00142.safetensors b/model-00004-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d4cafbbc4fcedfe5b26f46d984fc8e5e606bb3a9 --- /dev/null +++ b/model-00004-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3fd184b4c2ed323c301bc639e8237d3103a45e1d4bd00c955a489eca3787ed6 +size 4992949280 diff --git a/model-00005-of-00142.safetensors b/model-00005-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..47e33b83422842e1aa1e3abbcd4786246951c1cb --- /dev/null +++ b/model-00005-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa53425e1cec0b9697762e69c1a5ce2e82fcdd4a741035f29004dc4c982a0a1f +size 4986018232 diff --git a/model-00006-of-00142.safetensors b/model-00006-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..209402b884f157e04f214a8e2a5337542707e760 --- /dev/null +++ b/model-00006-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1c14ea1156b6c07f836de5c4802af8cd000799d1d730c158124c9fe707c1d66 +size 4992949232 diff --git a/model-00007-of-00142.safetensors b/model-00007-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ea0666209dc0940e398061b2c6d403e30f756978 --- /dev/null +++ b/model-00007-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30dfadcc6f18d982a46750c8e1a1e22ad2cfcb95cec25fb251e1fa977b6e83be +size 4986018368 diff --git a/model-00008-of-00142.safetensors b/model-00008-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7583cea4db59a3c07a5f3aa30595203a1eb7ed6e --- /dev/null +++ b/model-00008-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a63fe6a363453c780eb12193afb36e52c17b70495b374b34090c2a2d03d48a7 +size 4992949096 diff --git a/model-00009-of-00142.safetensors b/model-00009-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f657f8db8c63247dea211bb6ea11b996f951d0f1 --- /dev/null +++ b/model-00009-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c59123542e3f62d13f47c15f3af496ffb6fcfce207e0df9722d042e59c935ff0 +size 4992949280 diff --git a/model-00010-of-00142.safetensors b/model-00010-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7c3daca919df13947ab08ad0cca85d3298a97477 --- /dev/null +++ b/model-00010-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90759f439669bf60fa3823ef39060209a352fdcffb08ac00ecdafce4f97e5e4f +size 4986018320 diff --git a/model-00011-of-00142.safetensors b/model-00011-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ea3b70b62c63fd649abab158372cc5aa61caa70b --- /dev/null +++ b/model-00011-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43ae6b98e82830a15df32379f2ad0d52516dac33ea367104e374ee3e1506bbf4 +size 4992949144 diff --git a/model-00012-of-00142.safetensors b/model-00012-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8ce6de536ddc030195e616eb6f91d84c1328cf40 --- /dev/null +++ b/model-00012-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf8214a7d9ad87df56e9f58ee2fc6302034e07efdd4e0edb169b1451b6c31471 +size 4992949360 diff --git a/model-00013-of-00142.safetensors b/model-00013-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7e6050c9f5d1f9439556a47da79293265f07daed --- /dev/null +++ b/model-00013-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:215b90a977a02019f7575526fe814cf5b0567a9371e2d9b78da5e39e306906ef +size 4986018584 diff --git a/model-00014-of-00142.safetensors b/model-00014-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..efa2a1357963193a7124c138e4f07ba50926235b --- /dev/null +++ b/model-00014-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf07e9a8ab421d48b0e41f58b9c6066ed37d6f6bb2ace4210e8f6c6402daeea1 +size 4992949512 diff --git a/model-00015-of-00142.safetensors b/model-00015-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a4e2df975af2c4a620219e498216fdbedc198f42 --- /dev/null +++ b/model-00015-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7fd7f1d51814a98ba5697f7eef55b677dc3548602f03fb5a02f287800612524 +size 4992949608 diff --git a/model-00016-of-00142.safetensors b/model-00016-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f985a8f0068db885fbc705c09788234b6c29d37f --- /dev/null +++ b/model-00016-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65c5817c7b245ed74de1c10208fc81e4023915103daac41bd9cef27feb3dd9fe +size 4986018520 diff --git a/model-00017-of-00142.safetensors b/model-00017-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a4256d75dbf84c5353cce7169d9d6957eb349a23 --- /dev/null +++ b/model-00017-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e6d12ce3ed87aac3fb760db74cc4d18312a21861635e0f83970c55c9c2e8026 +size 4992949560 diff --git a/model-00018-of-00142.safetensors b/model-00018-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aff042e5c517ba4d5a028a2ed394e6d76f4206fd --- /dev/null +++ b/model-00018-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ef01a28f95865ae58f01f7dd7f87cc021b4b79c07cda99b78c9e5d411181e5e +size 4986018672 diff --git a/model-00019-of-00142.safetensors b/model-00019-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ebb6fc69499f26fb6577382bdbffec73d9c9eb70 --- /dev/null +++ b/model-00019-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8622cf510427e5509f494c9686a1c24e1261bd735847fe96721830d2c459afdf +size 4992949424 diff --git a/model-00020-of-00142.safetensors b/model-00020-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..180bda8928b58b536c6cc86817b95742b1e7c71f --- /dev/null +++ b/model-00020-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6c26553f76d02fa5fe90138aaeb616ad271b3cdf2930f0b86a23427719f1d1d +size 4992949592 diff --git a/model-00021-of-00142.safetensors b/model-00021-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4e2ebd31220b9548651ea61fb3e3c7133701aaad --- /dev/null +++ b/model-00021-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea78da1df9a22ab5eb289ac7894c6d66686e4da1e3b539de5c5fd8350e9105fa +size 4986018624 diff --git a/model-00022-of-00142.safetensors b/model-00022-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f04985c10efa47911d8183919c44a1bd7ed503f5 --- /dev/null +++ b/model-00022-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8dfd0c71cd28827d81f8c60ea4e60861538f4f60bfea05fca604dbb7b167648 +size 4992949472 diff --git a/model-00023-of-00142.safetensors b/model-00023-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..72091117e788cf86fa74fc441f8282e22f049bd0 --- /dev/null +++ b/model-00023-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26152b1c5a70687b130be644261a866d638f746c70dd0cf9a3aae915a70fd1a3 +size 4992949592 diff --git a/model-00024-of-00142.safetensors b/model-00024-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..829dad9e89ee5328d24cae721fdbcac03a953380 --- /dev/null +++ b/model-00024-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c066dabbe470d5621b343ceb7a4b3cb6357aae9bda240244795f7299cefd8a61 +size 4986018576 diff --git a/model-00025-of-00142.safetensors b/model-00025-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9dfcfb8d60ce25d40d2292fa0396397982053344 --- /dev/null +++ b/model-00025-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51cec3665e6fe1bb94238ccb32f184d66ce4885d81f7cb00720e7c230573580e +size 4992949528 diff --git a/model-00026-of-00142.safetensors b/model-00026-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..68a8549d76f45e187705cf2e21df5c5da843e95d --- /dev/null +++ b/model-00026-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:923cf7e9f127a8165f02bfbe729ebd9739c2a63d072469609a12cafcf7178066 +size 4992949624 diff --git a/model-00027-of-00142.safetensors b/model-00027-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bc0d86ecb2c5a9fcd625e79090cc44ad6e1ed87f --- /dev/null +++ b/model-00027-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d06830fca685aeb3543b2ee228771e9409e9fe9f2e49f4aa31ac3e8ace50416 +size 4986018496 diff --git a/model-00028-of-00142.safetensors b/model-00028-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..74151da990c368e65f1f3c76a2ae5e8b1849f354 --- /dev/null +++ b/model-00028-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27ae58e62ad2d1290e19ce3293f61ddab2958de2ef1820d118d773502dac156b +size 4992949576 diff --git a/model-00029-of-00142.safetensors b/model-00029-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5a891849a8dd9ef8eca470c406c6e275799ed781 --- /dev/null +++ b/model-00029-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f22e2af4e89fb89e1a8ea03fccd4ee497303e3a01dbdb91beb7542ca6993d7e4 +size 4986018656 diff --git a/model-00030-of-00142.safetensors b/model-00030-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f0699437e91fb1ea8b1dfd8fd06d52830ea1b861 --- /dev/null +++ b/model-00030-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6e67b3e9de4864a4466e13af36083300c6ece3c116c7a4121307fe59c4532bb +size 4992949432 diff --git a/model-00031-of-00142.safetensors b/model-00031-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..50d11eb8d6e7251c6cc2c3c7987d4cb16e079598 --- /dev/null +++ b/model-00031-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:360f614917dd9e611c9178e2516946654e58153464c4aa409ef066f522fc0d9d +size 4992949592 diff --git a/model-00032-of-00142.safetensors b/model-00032-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..94bef1e6d04eee4f700efd4b5d51a9e8b7f89abd --- /dev/null +++ b/model-00032-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e235f3618f001e37602893a0277ec1222d1917322951b2a2a6ea6c266aaaf450 +size 4986018608 diff --git a/model-00033-of-00142.safetensors b/model-00033-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d02b6ce6323ddf9484b99c7c7b5ba372bd5c218d --- /dev/null +++ b/model-00033-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:137a9e622d286ca39a28cefa77196d877b26895e84ca94c543abdda4c52fb408 +size 4992949488 diff --git a/model-00034-of-00142.safetensors b/model-00034-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e70bf10dc63f03183dfbf56408eca60df948b396 --- /dev/null +++ b/model-00034-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59b7197119bf45f10ca7688a348f9d328601b573c6fc2dc9d4efbcd1dec7f2af +size 4992949592 diff --git a/model-00035-of-00142.safetensors b/model-00035-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3760e4ba2f334b78e857ac9065388a018c8f1e9a --- /dev/null +++ b/model-00035-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35600feb01bdb2945f1286566516baf18e93b88c23345c38566ba3ab6e333c40 +size 4986018560 diff --git a/model-00036-of-00142.safetensors b/model-00036-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d29251d23c009efc61cd9be49ba025b648dc6109 --- /dev/null +++ b/model-00036-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:776239ad36609746cdde923c0f984c659120af3f9f3d87109a9d1d01479088d6 +size 4992949536 diff --git a/model-00037-of-00142.safetensors b/model-00037-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9a7b1f615553628a8d4ced2e14187bfae6e659cf --- /dev/null +++ b/model-00037-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d272b7ebea4df861bcb3edd8555a84aadbedfd929fc81e25fd229d2e69bb97f5 +size 4893306064 diff --git a/model-00038-of-00142.safetensors b/model-00038-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a0116acc81e3d50903ac025fee4f33a9ba0715d1 --- /dev/null +++ b/model-00038-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:050f44ecf44b55018dd5bdf1caa458849b7d4d1d3a149244adaa8a3eb4f3c641 +size 4991289440 diff --git a/model-00039-of-00142.safetensors b/model-00039-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..23335e74570c69b30cf366c4f59a746554c031a2 --- /dev/null +++ b/model-00039-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:704555e1bfb3d5e86e4b99c9474abbb8d66ab31390e5c9e1cb4155ab6679173a +size 4992949592 diff --git a/model-00040-of-00142.safetensors b/model-00040-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8cf1ddbff90a0caf34d64604bb5c25d73e6386ea --- /dev/null +++ b/model-00040-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93db6df776ca95a3107789d3e9a63c1a2cea61975bcd148496786e5fc2361b12 +size 4986018640 diff --git a/model-00041-of-00142.safetensors b/model-00041-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..383da84529cb9b6a0b9a69e7ecc080de26127d3c --- /dev/null +++ b/model-00041-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d582b5e1d32311ebb610115af8a14afeb8110ee9a958a72fc81288e525a091ac +size 4992949456 diff --git a/model-00042-of-00142.safetensors b/model-00042-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f6ac76740701ccd1b11e833c09cc11ad55887cb1 --- /dev/null +++ b/model-00042-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23c4d97420a09b479126ebd41a68d002864cec90da3d608dbf324ab286764cbf +size 4992949592 diff --git a/model-00043-of-00142.safetensors b/model-00043-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..df14a9257bcbf1bddcc3243f968090110d2f48c7 --- /dev/null +++ b/model-00043-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2064f781e2a33fd5ac27b8285181b18e56d5bc434134cf6206aa775d0b1e0529 +size 4986018592 diff --git a/model-00044-of-00142.safetensors b/model-00044-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..75348bc945bd9d52cfdff58f588ac86e130331ab --- /dev/null +++ b/model-00044-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b3ee700ffda38324ce809b9da2d379b02164564f6c0f4569664b8a6667d29ed +size 4992949504 diff --git a/model-00045-of-00142.safetensors b/model-00045-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b5d10212d28d1fc1ec9fac610173632cfbb997d0 --- /dev/null +++ b/model-00045-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9789cecfc144d4a1858aab56a0facc29d5f037a0f0bdea76481c0407680b3e8 +size 4992949600 diff --git a/model-00046-of-00142.safetensors b/model-00046-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7a873d029abec6ad392797089025f40ddaa23625 --- /dev/null +++ b/model-00046-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3628fcde2c43224c9b61ff6f9d556435e090c10a3c3db5abf86a8ff9f5560084 +size 4986018528 diff --git a/model-00047-of-00142.safetensors b/model-00047-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..de6e05d2d7cd2cb7afe150fe99c6f939541564ba --- /dev/null +++ b/model-00047-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e570e28a704333c4ee66d6de89461579cf9dc0769ac67daed235e9af5b1690a4 +size 4992949560 diff --git a/model-00048-of-00142.safetensors b/model-00048-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..66ea4e44d03d94423a71f2bba93aeaabaa63cc76 --- /dev/null +++ b/model-00048-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1569d7a78c31c91c3a813dbb28f59f9fbb827190d3f42c862279ab12712ddd11 +size 4986018680 diff --git a/model-00049-of-00142.safetensors b/model-00049-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6c98eaec4e967acd3f18f0e493ad7b3d5e4b18af --- /dev/null +++ b/model-00049-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42a1f9ea0b86830d9c037879eb6e65f4da085ce364d7607a75b42d970fbfe14d +size 4992949416 diff --git a/model-00050-of-00142.safetensors b/model-00050-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8e2774ad996528fff4443f201aebbc075917f083 --- /dev/null +++ b/model-00050-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c175c5d27b6b212b8995feb8aec5aa9a594c7ffd9e415253845a576dab01b26 +size 4992949592 diff --git a/model-00051-of-00142.safetensors b/model-00051-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d0635c9501bfbf0d8fcfa23c026f243f1b241706 --- /dev/null +++ b/model-00051-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f2ee9e8ab49036c9559b664204bacf1ea80b2900ee2b8649f8681be27b4f4f1 +size 4986018632 diff --git a/model-00052-of-00142.safetensors b/model-00052-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..50151bcbc8911f855336130f9dd606524b61e3d3 --- /dev/null +++ b/model-00052-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d1259348933da0b10b40c1fbc7b6c1e3d9d347e8eb61c76423d1533fdbb897b +size 4992949464 diff --git a/model-00053-of-00142.safetensors b/model-00053-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9163094ccefa5c7c68ead845e808dccd2676a415 --- /dev/null +++ b/model-00053-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8348ade6a3eea8004d03ec452b2404ac8a45ab45c1217b197a97d712df484fb +size 4992949592 diff --git a/model-00054-of-00142.safetensors b/model-00054-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3d0182c2be7820f51ab4780451bfc5fc6b41b74b --- /dev/null +++ b/model-00054-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69b309e1f6831594293e6d150e054b4f85221b650684015e1538493a409d703c +size 4986018576 diff --git a/model-00055-of-00142.safetensors b/model-00055-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7596ea5b6ab00a121ca94e2f8fe4866acddd9ce8 --- /dev/null +++ b/model-00055-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acdb4f6a0d700c4c45154c4f6f3da4b3c34996ac9689d3f0dd874020f01a1abb +size 4992949520 diff --git a/model-00056-of-00142.safetensors b/model-00056-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d2760bcdb569fbb8fb54209b87d5e1e87762567e --- /dev/null +++ b/model-00056-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7c02e3dea881c75b518721c9ea0f3181f6362cb9cdf05cbbf7ffa6608a11381 +size 4992949616 diff --git a/model-00057-of-00142.safetensors b/model-00057-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..62a613aa8b4b6ad9e09f2c035220cac026c83841 --- /dev/null +++ b/model-00057-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aff5b3787e55d943099c31b96e9c745d4e89b6483ee39d62c99af21d2e1a33d +size 4986018504 diff --git a/model-00058-of-00142.safetensors b/model-00058-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..34cc4a6693d0e70cb3da0a040be6827d0f915d76 --- /dev/null +++ b/model-00058-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cd98e4d5a4c183ec102e2855fc11382ee1b3fdf690cd904eea712b2bc6a4f54 +size 4992949568 diff --git a/model-00059-of-00142.safetensors b/model-00059-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a27fa8d57849077d5b0dd8240adc4c90fe2aa434 --- /dev/null +++ b/model-00059-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2628b94169dc510efd82349fc225063964193ddcb86b135ee6a273cc40479ded +size 4986018664 diff --git a/model-00060-of-00142.safetensors b/model-00060-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..03da97283fe645c10e307f8a9c8165df39f66d9f --- /dev/null +++ b/model-00060-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8b028b65391d91148215dd19c2debce70f84783a405263ab09d4dfd561cb2a2 +size 4992949432 diff --git a/model-00061-of-00142.safetensors b/model-00061-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7085951f4040fd7492074c84fc14a76f95e0513d --- /dev/null +++ b/model-00061-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1392b4f6c661cffba9c9569e420d7786f4e1d414f8a13196fab35ee1828e0cc4 +size 4992949592 diff --git a/model-00062-of-00142.safetensors b/model-00062-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aae95971529d5098cd997498492dc280e269d45b --- /dev/null +++ b/model-00062-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0710964ff35c525b1803cb8f58f4e13009b1e06be62ab2d16189493bb2a113d1 +size 4986018616 diff --git a/model-00063-of-00142.safetensors b/model-00063-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..870cc6914fa4a604ed173c697cbf06fc1224c3bc --- /dev/null +++ b/model-00063-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c1fe180e05617c9f49592d415764a749308e0aa58f1645107ce7509886d83fd +size 4992949488 diff --git a/model-00064-of-00142.safetensors b/model-00064-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ca32ddf4fa2644809018ddf5696d2690ee837189 --- /dev/null +++ b/model-00064-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc120f6ecb23107d0f2dadf3030bc7bb1c2f06598856ecdda0165aebddd92d25 +size 4992949592 diff --git a/model-00065-of-00142.safetensors b/model-00065-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5e416872baea0ae42749d8630d60a713148fa759 --- /dev/null +++ b/model-00065-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0e6d83b5d32859315d8fb3b2279b5fc86e31d32c480dae9b74a9c34bec7b826 +size 4986018568 diff --git a/model-00066-of-00142.safetensors b/model-00066-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..09a9366a0d1db826d24ed9330e97635cc5c2f19c --- /dev/null +++ b/model-00066-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f936754421bfd10a683c22db957fffdbb8ab846d189917372249dffe00c7e3b3 +size 4992949536 diff --git a/model-00067-of-00142.safetensors b/model-00067-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ec81f80079b3656914194df02e1dbeb1d84e473c --- /dev/null +++ b/model-00067-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae5ad1bc7a34056ab25355d5ea3a5d2ca01e041e75e041292e9b99a7667d044a +size 4977221008 diff --git a/model-00068-of-00142.safetensors b/model-00068-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8aa60c2bb19473e331d784f3e2f361b70d6ce3a5 --- /dev/null +++ b/model-00068-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a8110300ef296c9f23ba2a2b9e29d14ceb5f8a55c3c7af2a96c29d4a516d94e +size 4986018336 diff --git a/model-00069-of-00142.safetensors b/model-00069-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f025c8d59f31993e9c498786ee519310fd5e8dcd --- /dev/null +++ b/model-00069-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0872836c61e664cafd0a0d23eb746a1a3ac04d2967d0a82f7f2f18912a31f4e1 +size 4992949584 diff --git a/model-00070-of-00142.safetensors b/model-00070-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a98e543976a35af1f5368ad9fc4295dd979f95e1 --- /dev/null +++ b/model-00070-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f36caefe9bd747d1e2917ab655dc222d628480f75114826e1dcf517350e31d61 +size 4986018648 diff --git a/model-00071-of-00142.safetensors b/model-00071-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2c7325ef7e142434eb77011dc32cde96ab748456 --- /dev/null +++ b/model-00071-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb4bd770c4a83e0f54d43055f47893d02f7c791c314d112014437e495c855434 +size 4992949448 diff --git a/model-00072-of-00142.safetensors b/model-00072-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aa4f69efbb4a675d4d14db65255fcea9a4b6d3ce --- /dev/null +++ b/model-00072-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe639ac383657fe490d492b760044266b73ca609b58e767c3b03ef5aa853d268 +size 4992949592 diff --git a/model-00073-of-00142.safetensors b/model-00073-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1a0db41a7aa5fe6a9e99217596b99b3326cc63fa --- /dev/null +++ b/model-00073-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:195eb9f76f080f00b97c09843195e6840d388251796cfc6a4ac2f4c71f8f92b7 +size 4986018600 diff --git a/model-00074-of-00142.safetensors b/model-00074-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c83c0c8f462e78f48de62c83103106dcb47e2cc7 --- /dev/null +++ b/model-00074-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2638c53dca6d7150ee8330248fc9b9a196142ddcd4414c59465b77bf426454e +size 4992949496 diff --git a/model-00075-of-00142.safetensors b/model-00075-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..58c209724cdc6e79281ee8723b81326473110529 --- /dev/null +++ b/model-00075-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f32325abd125b8775159590c4096c8b183cf92eabbd5d96e4b554b39b4fbc9b9 +size 4992949592 diff --git a/model-00076-of-00142.safetensors b/model-00076-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2052928076925c781d1c9657993adcf461d01475 --- /dev/null +++ b/model-00076-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29615974af9f09200d9a2011a5e944012ab19857e8393a99a7b8d045fbb4d3d2 +size 4986018552 diff --git a/model-00077-of-00142.safetensors b/model-00077-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3e85d4cae496c2017164592882d20f63b99ed9ee --- /dev/null +++ b/model-00077-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49080b6021ffb154402705d45ea54a476094c0c5f9b0a6a752b5d3aad774d779 +size 4992949544 diff --git a/model-00078-of-00142.safetensors b/model-00078-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f14128d85fa2d622cf8d0ea5f393d3caff39e265 --- /dev/null +++ b/model-00078-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54e82d9761001dc0be94ab3961e595efe5291b98d83153e418b63e73e140e136 +size 4986018688 diff --git a/model-00079-of-00142.safetensors b/model-00079-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd69c3d32ef7ce3acc39fdb968d7e5cb13bc3a93 --- /dev/null +++ b/model-00079-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95dca7277c150a482b986528d76c549a491ea18f8e1869c2fcab2271052d66e8 +size 4992949408 diff --git a/model-00080-of-00142.safetensors b/model-00080-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d48e1d58e1d57d2c993e15864c154c2818740b2 --- /dev/null +++ b/model-00080-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a72df3d167464c8a7ba8c771660a14372dd5ab01b7f0b72ae5800fd9cc3db863 +size 4992949592 diff --git a/model-00081-of-00142.safetensors b/model-00081-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0b3994e9f4adbc7432d45627ddbf9ddc17361140 --- /dev/null +++ b/model-00081-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1258d90c5948e9715a054cfa503c091c975ee4cf48fc01e26c78c68db2ba39b2 +size 4986018640 diff --git a/model-00082-of-00142.safetensors b/model-00082-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..90f9e55de66c178f2e35e7099659f65d209ca419 --- /dev/null +++ b/model-00082-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a940583af148ab17f22da5c80c97b303f4febb3b5423c18fb8fb2f6170486ab1 +size 4992949456 diff --git a/model-00083-of-00142.safetensors b/model-00083-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..914d7f97484f903ec715f6e1d0c13b96fc0b1f5f --- /dev/null +++ b/model-00083-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0673cd94229b4fe8d124742786ec4ee8422a837e074b5f8f439921c3c1e2900d +size 4992949592 diff --git a/model-00084-of-00142.safetensors b/model-00084-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9f9802e9ab1cb3148fcc53395b0b780236c24c82 --- /dev/null +++ b/model-00084-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0864316152beca2852a3ad9840d640836c06d69e55c7699ab459d534ad7dfee4 +size 4986018584 diff --git a/model-00085-of-00142.safetensors b/model-00085-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bcefe1d549c12e8e42dddfabe2b1c25cd9f0ffd5 --- /dev/null +++ b/model-00085-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5b9888c58337d5a673379e37e95c525c144033a8872064994162f47433503cc +size 4992949512 diff --git a/model-00086-of-00142.safetensors b/model-00086-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..21010104885c1519df8de3c42a0a500ee7d1a423 --- /dev/null +++ b/model-00086-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cc6ffa000a27bc5fc84b324ed2d2e1218ad9ee35197fd22fc99403fc3928376 +size 4992949608 diff --git a/model-00087-of-00142.safetensors b/model-00087-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..41ee54f8b0d64f9ff1a3f61e070d2e93816a0451 --- /dev/null +++ b/model-00087-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97b0b3250771ab8eaef2d063656986ac4e87bb18c34d8d9aa49bd1993b79e986 +size 4986018520 diff --git a/model-00088-of-00142.safetensors b/model-00088-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5696a68bf7ee0ef0970acc28eee1e1cc1cd7d36b --- /dev/null +++ b/model-00088-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fba4b7e7744a0fa7ecf7ea9db8a54b7608323bf785930d8f95612f7ed5d9118f +size 4992949560 diff --git a/model-00089-of-00142.safetensors b/model-00089-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..441fa61b411763d1d2970f2ed828204ae1f0056e --- /dev/null +++ b/model-00089-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f76718ea0006511c5ced4c420492d339a7ab58be59cb660dbb34f1803409058c +size 4986018672 diff --git a/model-00090-of-00142.safetensors b/model-00090-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..816266ac39cfd178370fef22a5350a2fc77d73d2 --- /dev/null +++ b/model-00090-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ef363c91bdb3c3f0eb1d249ae848cdfea85555872f9708887853ad3333bee4c +size 4992949424 diff --git a/model-00091-of-00142.safetensors b/model-00091-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e4b56c08395b3244f297cfe5480d464f7421b046 --- /dev/null +++ b/model-00091-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4db72e9242b9e67fc9c28ff27d5402f5ee34c01fc15c1766eb632ed277f922a +size 4992949592 diff --git a/model-00092-of-00142.safetensors b/model-00092-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..43c3a61dc3cbf80974c2638b1d5ef0d942bbc5b2 --- /dev/null +++ b/model-00092-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e242f8c047956888c1482447638c3470baf20dc2eed050030a262eceab0ddc20 +size 4986018624 diff --git a/model-00093-of-00142.safetensors b/model-00093-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3ac5bef09f2b38faf66c6c1223d4bf037ee28e42 --- /dev/null +++ b/model-00093-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b9ce4c78463556fcb3d19c22d7ac4297d4a7187c3339fd1cdd89eec980e245e +size 4992949472 diff --git a/model-00094-of-00142.safetensors b/model-00094-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..47bd908d9ed50c2fb1aadd9b14f27084207eda42 --- /dev/null +++ b/model-00094-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9844b7090261b8d67a4e3dd869b5e438b455fd1b00239b9e901b03f4d89fc513 +size 4992949592 diff --git a/model-00095-of-00142.safetensors b/model-00095-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8479dad39f3cdab88563616e98adadeba143be1f --- /dev/null +++ b/model-00095-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c71c982db2d31cb1fe86efc82a08271e66d15e12e60ba6e15b6eb311b58fd274 +size 4986018576 diff --git a/model-00096-of-00142.safetensors b/model-00096-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9893931e4b7ae7837d9ee1ea2242a702fad4fb98 --- /dev/null +++ b/model-00096-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ed78c3b9c8cc5a6e1d4759b60e5701df5d0f07b2ad7a811ca130a68f430dab4 +size 4992949528 diff --git a/model-00097-of-00142.safetensors b/model-00097-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8eb1656ef0c16ec876036cb0d75844af34c52874 --- /dev/null +++ b/model-00097-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6322215b699908c97799cb45e5e51e9cedcaf1785bfb3912af967f2bc82f34f3 +size 4992949624 diff --git a/model-00098-of-00142.safetensors b/model-00098-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8431b6a8a791ca5c344073f5982c2681de8193d8 --- /dev/null +++ b/model-00098-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57bd3fb670706eb78c199bea011017c46d58d34f5920773da639408863fd5033 +size 4986018496 diff --git a/model-00099-of-00142.safetensors b/model-00099-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c9e79ed300e4c5085ec356007bbf584ab78aba42 --- /dev/null +++ b/model-00099-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c53cc155e0fc72cb16a2992559d1015bfedacd08fb1e307bf5dc4ad50a47578 +size 4992949576 diff --git a/model-00100-of-00142.safetensors b/model-00100-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1062dc565dab077abad874705285725eb0567730 --- /dev/null +++ b/model-00100-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6081b46dbd356aba0c1cb240a9439088515c2a1b124d85a796ba4429f0430364 +size 4986018656 diff --git a/model-00101-of-00142.safetensors b/model-00101-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..63d97b184c039eb91b5a73faf04deb0b3ba8dc89 --- /dev/null +++ b/model-00101-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bda10b6e70599813850f1eff4689f5d086f6828b3ac5a9239880bf4094dbbcfd +size 4992949432 diff --git a/model-00102-of-00142.safetensors b/model-00102-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5eef64c9be351b770734159a52fa83e9833f3de3 --- /dev/null +++ b/model-00102-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eb071cdfb3d26779e5b3a31e66e6dcbc772324aa1360a488aeac8f6b93d9db7 +size 4992949592 diff --git a/model-00103-of-00142.safetensors b/model-00103-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5c911c0c6908cc0be403f376b74ef5375740c3d0 --- /dev/null +++ b/model-00103-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf0428efa22d2c02ffae43b02b599a60369666eb002b751d467fe336a93e4bf0 +size 4986018608 diff --git a/model-00104-of-00142.safetensors b/model-00104-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..614d9eb9ae45d4eb449a035bd582008f44207890 --- /dev/null +++ b/model-00104-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ea1d6e731fb8da77a845020620686d1bdcfc0bd8f5432a91e6508c9a22ea75b +size 4992949488 diff --git a/model-00105-of-00142.safetensors b/model-00105-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2a685e57311195e2f74926edd6f8b035100e418b --- /dev/null +++ b/model-00105-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e068796fd8ad39da2776bc7d28b1a2af20b27c356ab2cab0c940b378e5020ee +size 4992949592 diff --git a/model-00106-of-00142.safetensors b/model-00106-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9075a401f3286e0ce3b39185b347624c31112820 --- /dev/null +++ b/model-00106-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ba88672b2765b0846bf5974ffae6065287eb1762a1c4e3db61e57adbcd8fbe0 +size 4986018560 diff --git a/model-00107-of-00142.safetensors b/model-00107-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3726d36bdb6e014f44c3d41039e60e85ee75c38e --- /dev/null +++ b/model-00107-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:671c0031968e157269a26e5bb1362f95896c0e086df5886dd0fc3a1e1ae829a2 +size 4992949536 diff --git a/model-00108-of-00142.safetensors b/model-00108-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3efdb6eb68c726255701590c6c0c8b0f1e458742 --- /dev/null +++ b/model-00108-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d90d5ed1297a374597e0ae98cb5e8a917e15165c4d1a505f6c5afba616737c7d +size 4893306064 diff --git a/model-00109-of-00142.safetensors b/model-00109-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..354f5a66cc049db39fc953d5494c50ea081a2e81 --- /dev/null +++ b/model-00109-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f37aebc4e7ddb98adf24a0279410e1c6473feeccef6fd919af34e72d04b751ae +size 4991289440 diff --git a/model-00110-of-00142.safetensors b/model-00110-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4e8b2f09d271abc47a36240debda030f49a50efe --- /dev/null +++ b/model-00110-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:effc31ac270261c1c9d75e1e54cfabf4ca2f8d96d929e3e620296a4237603fbf +size 4992949592 diff --git a/model-00111-of-00142.safetensors b/model-00111-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1cdc5f61698db8f890b5e194e9ebee0ec1d1332b --- /dev/null +++ b/model-00111-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:514d25543d7ae1cd54d3285d2082fb7ad1d55bae7847fb4408ffce41f7078aac +size 4986018640 diff --git a/model-00112-of-00142.safetensors b/model-00112-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e60f5d844852ff2d56813bf391e123e80e336788 --- /dev/null +++ b/model-00112-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abe3e388e4f975b22938f2a601242394aded65424cca6b11807a2fc28c946b52 +size 4992949456 diff --git a/model-00113-of-00142.safetensors b/model-00113-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..79d3e4a62bfd6cdc21f27a785168d846da9473dc --- /dev/null +++ b/model-00113-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b1d2b86db2e0629b9545a854f73354c2abe88009155d321fc46ea5ab04981f8 +size 4992949592 diff --git a/model-00114-of-00142.safetensors b/model-00114-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f8a88657c8298d9c3e6d6db0bb8d4c019e373836 --- /dev/null +++ b/model-00114-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e333efa43a3afa4bb90f0cbf262e443ffe2e5772f3c4c928a1090ee0f91802e8 +size 4986018592 diff --git a/model-00115-of-00142.safetensors b/model-00115-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..56806cd24b711f05bb898ba54656441412deeac5 --- /dev/null +++ b/model-00115-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9351644dc6abe3b5ec9f8d65866459ea19fd297dbd08e7570425e09600aa9157 +size 4992949504 diff --git a/model-00116-of-00142.safetensors b/model-00116-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8425333c20e19d7f92f8da773f1350e3b50572a0 --- /dev/null +++ b/model-00116-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f4a6e75f3604d404ecddc0da1ff076b0c0f1ee4c52e1f4e0d9e0ac228c674dd +size 4992949600 diff --git a/model-00117-of-00142.safetensors b/model-00117-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..891c20604051a3c7a910818416692a0e5f4ac24f --- /dev/null +++ b/model-00117-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4868eab7066cbca4f9c06bd2f6529145d51a4dc7f9b2042eb48abdd38c3f5e9 +size 4986018528 diff --git a/model-00118-of-00142.safetensors b/model-00118-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ed217aa8c333ab9b1e224982d57d6abce6fa8cb2 --- /dev/null +++ b/model-00118-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de06133ec7af4dc88b268ac01740885d2f1a052692f550ebec71be128756904e +size 4992949560 diff --git a/model-00119-of-00142.safetensors b/model-00119-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d33878f1a66cae83246ed879e0fa5e2272e94c1b --- /dev/null +++ b/model-00119-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37238d22f13fddf84f4b7a4306849318911e903356d5bf9a5b2f231f1a235580 +size 4986018680 diff --git a/model-00120-of-00142.safetensors b/model-00120-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1f184d51ae5dfa16f8a5c2c6ce07fd915fed51ff --- /dev/null +++ b/model-00120-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e35c92f7217e8b4ec974df1788e6d88244fe5e45af6041be90b16f7b5238076 +size 4992949416 diff --git a/model-00121-of-00142.safetensors b/model-00121-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..68c1149806dd18f6bd185365e0dd8960b0bfc454 --- /dev/null +++ b/model-00121-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b047b13701edc0f346e9c56b06f77c1aabd3e4ae35ec6fa32058d0c0867bfce5 +size 4992949592 diff --git a/model-00122-of-00142.safetensors b/model-00122-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1f05cd843d238f9e6146239beab7a60598547062 --- /dev/null +++ b/model-00122-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bdb5d02274584b01dd2e73f8d2a3886612521c95b0abc59b838dd22ff6f36e9 +size 4986018632 diff --git a/model-00123-of-00142.safetensors b/model-00123-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bf46310ce21b50d274aded35365c4d725b5485d1 --- /dev/null +++ b/model-00123-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:664d95dba350c9c734a47440ffd5ae7229fbb1b2cdb549df68cb30c980c68843 +size 4992949464 diff --git a/model-00124-of-00142.safetensors b/model-00124-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..adbd7d7ee5fb03af6c008bf55cb72e988c841c9b --- /dev/null +++ b/model-00124-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:728a700908b671c35fa5b438245e2104ceef8a57908836e340a33494303da195 +size 4992949592 diff --git a/model-00125-of-00142.safetensors b/model-00125-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c7c85a26d8ac3cbbf8b8180cdb6b7e0166020463 --- /dev/null +++ b/model-00125-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:165ccefe39003673e0189774ad8211fc29c223ed2ade483993c712243f1880dc +size 4986018576 diff --git a/model-00126-of-00142.safetensors b/model-00126-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1badd3507e41f4a94a2711d750a6ff28d23398b6 --- /dev/null +++ b/model-00126-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a6a796dddaea8e9553cc12912db1cffa4ebd6ba1f26e2d454dfe00f10736397 +size 4992949520 diff --git a/model-00127-of-00142.safetensors b/model-00127-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a9e98d8567c69ad307890dca6cbc5e4c381e5d52 --- /dev/null +++ b/model-00127-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ec37303d4c9d216846548c2a36732f0aa6b24b39c27eafc9c4812190153c69c +size 4992949616 diff --git a/model-00128-of-00142.safetensors b/model-00128-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7a193985fd38e9c85a4aed4e7398a470012e9e01 --- /dev/null +++ b/model-00128-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d6f4d56a903cb4b8f4f73741ac22ba3fac83c9785fe297f45d79fc5ff5cf743 +size 4986018504 diff --git a/model-00129-of-00142.safetensors b/model-00129-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cd18c4a2091a90ac951f0a5e4695f6f0720de8bf --- /dev/null +++ b/model-00129-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c6159866646e25849bb1e56c1b607253a7ba73f18ee2fddb98073427f46c6c8 +size 4992949568 diff --git a/model-00130-of-00142.safetensors b/model-00130-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c80eac404e960580109b09b8403438295b6d6358 --- /dev/null +++ b/model-00130-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:516b6dfb1185d24085602a02ada48c62a406446755e2990d0b28763360f9a62a +size 4986018664 diff --git a/model-00131-of-00142.safetensors b/model-00131-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..82709ca6ed1651575b48a112aa723df8a132fe1b --- /dev/null +++ b/model-00131-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa29064eb35922976c929dfdcb4270dce5dd8a84398a6637af62dbd2c7554104 +size 4992949432 diff --git a/model-00132-of-00142.safetensors b/model-00132-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cc40838be8e3a5b40f89a8566695ce6ea46f5544 --- /dev/null +++ b/model-00132-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec4c34f9115bb874763a067a655b4a2b6f532f58297f87488449ee2571d41885 +size 4992949592 diff --git a/model-00133-of-00142.safetensors b/model-00133-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9ba255ea43aad29cb95750fa395ca330b0b6337f --- /dev/null +++ b/model-00133-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3cb0b6c6b97557134d93d803f5c312bd5fad0825dfd2f13da12d512abf966bb +size 4986018616 diff --git a/model-00134-of-00142.safetensors b/model-00134-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d992915465590ef2fb2fcb71b3bcfb86fe6849c8 --- /dev/null +++ b/model-00134-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:058b9d99e27014babbb99d5f51d2972846d6fd1b6775375013a426003708832a +size 4992949488 diff --git a/model-00135-of-00142.safetensors b/model-00135-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..159c8f751309c5ec189d861df57fd5df7bf597f1 --- /dev/null +++ b/model-00135-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acd68bf1a48feb6d428cd64734f56a141d868ef4dc701b9525349e22cba80ea5 +size 4992949592 diff --git a/model-00136-of-00142.safetensors b/model-00136-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..76aaa13a8c8ae730853c8014e76fc0daf24fdb87 --- /dev/null +++ b/model-00136-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:256a5fe9283c7d29183cde70307e866a13bf91fc4388272a5c2c8c99f9309f3f +size 4986018568 diff --git a/model-00137-of-00142.safetensors b/model-00137-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e0b2e88d97485b33e31c515e78589576daf16486 --- /dev/null +++ b/model-00137-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6d99d338bd9086c9f2cd0bfa75533cde340580c24e8fdae082b9fa7a079a5f5 +size 4992949536 diff --git a/model-00138-of-00142.safetensors b/model-00138-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d91d07a1d5115b3c0b8102a0bc5a390ad91b9830 --- /dev/null +++ b/model-00138-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42d00b239e83b127aab734001faedac759f5feaa7ddf3b019eaea4a305691459 +size 4977221008 diff --git a/model-00139-of-00142.safetensors b/model-00139-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..282365f67fb364854713e3314cf0ec89f18827d3 --- /dev/null +++ b/model-00139-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:197c8fb56c9a29cc92dce850fce2fd04b4c1ac0c0afbb7ac9845210457f6ebcc +size 4986018336 diff --git a/model-00140-of-00142.safetensors b/model-00140-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b0aeb915a792d6f0e1d2ebb5dcdce7e8d77aab46 --- /dev/null +++ b/model-00140-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e66c06c8ca3cc47d68babd8f15ff857ad5c9a38e05b84c91c05d9f0fe096844f +size 4992949584 diff --git a/model-00141-of-00142.safetensors b/model-00141-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2ca7f140480f4db4840d381b9e27e6a99949a95e --- /dev/null +++ b/model-00141-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6efa8ee30eaaa3656f8874288f4f3dac56168822914d710a4d3417364aeb1e67 +size 4986018648 diff --git a/model-00142-of-00142.safetensors b/model-00142-of-00142.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..48aabeb055bbdc13c5d689cdfa2e26d7986d114e --- /dev/null +++ b/model-00142-of-00142.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df2d155c70dd975a5e8161c8b695c7209c6bdf2d18115f396d2fa6a3f171f28b +size 2182713568 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000000000000000000000000000000000000..41535813f4d94e3fa8a8a9bc6d3820e751428093 --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,44197 @@ +{ + "metadata": { + "total_parameters": 352797814784, + "total_size": 705595686528 + }, + "weight_map": { + "lm_head.weight": "model-00142-of-00142.safetensors", + "model.embed_tokens.weight": "model-00001-of-00142.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-00142.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00142.safetensors", + "model.layers.0.self_attn.k_norm.weight": "model-00001-of-00142.safetensors", + "model.layers.0.self_attn.k_proj.bias": "model-00001-of-00142.safetensors", + "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.0.self_attn.q_norm.weight": "model-00001-of-00142.safetensors", + "model.layers.0.self_attn.q_proj.bias": "model-00001-of-00142.safetensors", + "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.0.self_attn.v_proj.bias": "model-00001-of-00142.safetensors", + "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.1.input_layernorm.weight": "model-00001-of-00142.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00142.safetensors", + "model.layers.1.self_attn.k_norm.weight": "model-00001-of-00142.safetensors", + "model.layers.1.self_attn.k_proj.bias": "model-00001-of-00142.safetensors", + "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.1.self_attn.q_norm.weight": "model-00001-of-00142.safetensors", + "model.layers.1.self_attn.q_proj.bias": "model-00001-of-00142.safetensors", + "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.1.self_attn.v_proj.bias": "model-00001-of-00142.safetensors", + "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.10.input_layernorm.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.0.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.0.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.0.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.1.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.1.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.1.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.10.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.10.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.10.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.100.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.100.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.100.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.101.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.101.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.101.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.102.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.102.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.102.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.103.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.103.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.103.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.104.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.104.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.104.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.105.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.105.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.105.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.106.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.106.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.106.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.107.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.107.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.107.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.108.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.108.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.108.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.109.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.109.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.109.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.11.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.11.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.11.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.110.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.110.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.110.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.111.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.111.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.111.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.112.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.112.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.112.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.113.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.113.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.113.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.114.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.114.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.114.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.115.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.115.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.115.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.116.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.116.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.116.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.117.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.117.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.117.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.118.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.118.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.118.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.119.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.119.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.119.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.12.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.12.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.12.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.120.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.120.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.120.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.121.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.121.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.121.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.122.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.122.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.122.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.123.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.123.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.123.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.124.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.124.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.124.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.125.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.125.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.125.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.126.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.126.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.126.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.127.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.127.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.127.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.128.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.128.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.128.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.129.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.129.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.129.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.13.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.13.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.13.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.130.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.130.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.130.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.131.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.131.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.131.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.132.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.132.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.132.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.133.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.133.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.133.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.134.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.134.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.134.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.135.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.135.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.135.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.136.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.136.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.136.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.137.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.137.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.137.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.138.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.138.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.138.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.139.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.139.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.139.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.14.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.14.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.14.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.140.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.140.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.140.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.141.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.141.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.141.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.142.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.142.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.142.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.143.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.143.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.143.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.144.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.144.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.144.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.145.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.145.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.145.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.146.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.146.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.146.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.147.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.147.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.147.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.148.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.148.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.148.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.149.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.149.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.149.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.15.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.15.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.15.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.150.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.150.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.150.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.151.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.151.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.151.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.152.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.152.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.152.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.153.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.153.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.153.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.154.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.154.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.154.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.155.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.155.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.155.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.156.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.156.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.156.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.157.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.157.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.157.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.158.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.158.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.158.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.159.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.159.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.159.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.experts.16.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.16.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.16.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.17.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.17.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.17.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.18.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.18.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.18.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.19.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.19.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.19.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.2.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.2.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.2.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.20.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.20.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.20.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.21.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.21.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.21.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.22.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.22.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.22.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.23.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.23.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.23.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.24.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.24.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.24.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.25.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.25.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.25.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.26.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.26.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.26.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.27.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.27.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.27.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.28.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.28.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.28.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.29.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.29.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.29.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.3.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.3.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.3.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.30.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.30.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.30.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.31.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.31.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.31.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.32.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.32.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.32.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.33.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.33.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.33.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.34.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.34.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.34.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.35.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.35.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.35.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.36.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.36.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.36.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.37.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.37.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.37.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.38.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.38.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.38.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.39.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.39.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.39.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.4.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.4.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.4.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.40.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.40.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.40.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.41.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.41.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.41.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.42.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.42.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.42.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.43.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.43.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.43.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.44.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.44.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.44.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.45.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.45.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.45.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.46.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.46.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.46.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.47.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.47.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.47.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.48.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.48.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.48.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.49.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.49.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.49.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.5.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.5.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.5.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.50.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.50.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.50.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.51.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.51.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.51.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.52.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.52.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.52.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.53.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.53.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.53.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.54.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.54.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.54.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.55.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.55.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.55.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.56.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.56.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.56.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.57.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.57.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.57.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.58.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.58.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.58.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.59.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.59.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.59.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.6.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.6.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.6.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.60.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.60.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.60.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.61.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.61.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.61.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.62.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.62.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.62.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.63.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.63.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.63.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.64.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.64.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.64.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.65.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.65.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.65.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.66.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.66.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.66.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.67.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.67.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.67.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.68.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.68.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.68.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.69.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.69.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.69.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.7.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.7.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.7.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.70.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.70.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.70.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.71.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.71.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.71.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.72.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.72.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.72.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.73.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.73.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.73.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.74.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.74.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.74.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.75.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.75.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.75.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.76.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.76.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.76.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.77.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.77.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.77.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.78.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.78.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.78.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.79.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.79.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.79.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.8.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.8.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.8.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.80.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.80.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.80.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.81.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.81.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.81.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.82.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.82.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.82.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.83.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.83.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.83.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.84.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.84.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.84.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.85.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.85.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.85.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.86.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.86.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.86.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.87.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.87.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.87.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.88.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.88.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.88.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.89.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.89.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.89.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.9.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.9.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.9.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.mlp.experts.90.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.90.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.90.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.91.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.91.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.91.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.92.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.92.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.92.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.93.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.93.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.93.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.94.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.94.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.94.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.95.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.95.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.95.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.96.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.96.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.96.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.97.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.97.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.97.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.98.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.98.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.98.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.99.down_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.99.gate_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.experts.99.up_proj.weight": "model-00013-of-00142.safetensors", + "model.layers.10.mlp.gate.e_score_correction_bias": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.gate.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.shared_experts.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.shared_experts.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.mlp.shared_experts.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00014-of-00142.safetensors", + "model.layers.10.self_attn.k_norm.weight": "model-00012-of-00142.safetensors", + "model.layers.10.self_attn.k_proj.bias": "model-00012-of-00142.safetensors", + "model.layers.10.self_attn.k_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.self_attn.q_norm.weight": "model-00012-of-00142.safetensors", + "model.layers.10.self_attn.q_proj.bias": "model-00012-of-00142.safetensors", + "model.layers.10.self_attn.q_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.10.self_attn.v_proj.bias": "model-00012-of-00142.safetensors", + "model.layers.10.self_attn.v_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.11.input_layernorm.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.0.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.0.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.0.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.1.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.1.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.1.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.10.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.10.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.10.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.100.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.100.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.100.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.101.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.101.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.101.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.102.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.102.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.102.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.103.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.103.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.103.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.104.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.104.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.104.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.105.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.105.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.105.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.106.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.106.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.106.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.107.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.107.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.107.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.108.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.108.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.108.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.109.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.109.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.109.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.11.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.11.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.11.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.110.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.110.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.110.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.111.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.111.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.111.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.112.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.112.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.112.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.113.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.113.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.113.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.114.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.114.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.114.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.115.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.115.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.115.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.116.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.116.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.116.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.117.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.117.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.117.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.118.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.118.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.118.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.119.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.119.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.119.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.12.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.12.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.12.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.120.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.120.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.120.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.121.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.121.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.121.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.122.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.122.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.122.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.123.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.123.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.123.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.124.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.124.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.124.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.125.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.125.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.125.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.126.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.126.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.126.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.127.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.127.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.127.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.128.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.128.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.128.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.129.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.129.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.129.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.13.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.13.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.13.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.130.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.130.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.130.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.131.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.131.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.131.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.132.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.132.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.132.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.133.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.133.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.133.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.134.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.134.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.134.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.135.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.135.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.135.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.136.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.136.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.136.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.137.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.137.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.137.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.138.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.138.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.138.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.139.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.139.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.139.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.14.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.14.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.14.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.140.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.140.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.140.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.141.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.141.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.141.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.142.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.142.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.142.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.143.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.143.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.143.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.144.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.144.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.144.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.145.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.145.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.145.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.146.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.146.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.146.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.147.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.147.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.147.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.148.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.148.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.148.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.149.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.149.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.149.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.15.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.15.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.15.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.150.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.150.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.150.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.151.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.151.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.151.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.152.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.152.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.152.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.153.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.153.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.153.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.154.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.154.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.154.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.155.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.155.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.155.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.156.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.156.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.156.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.157.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.157.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.157.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.158.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.158.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.158.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.159.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.159.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.159.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.16.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.16.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.16.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.17.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.17.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.17.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.18.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.18.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.18.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.19.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.19.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.19.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.2.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.2.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.2.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.20.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.20.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.20.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.21.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.21.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.21.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.22.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.22.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.22.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.23.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.23.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.23.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.24.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.24.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.24.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.25.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.25.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.25.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.26.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.26.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.26.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.27.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.27.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.27.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.28.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.28.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.28.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.29.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.29.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.29.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.3.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.3.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.3.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.30.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.30.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.30.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.31.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.31.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.31.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.32.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.32.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.32.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.33.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.33.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.33.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.34.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.34.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.34.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.35.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.35.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.35.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.36.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.36.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.36.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.37.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.37.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.37.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.38.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.38.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.38.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.39.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.39.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.39.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.4.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.4.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.4.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.40.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.40.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.40.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.41.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.41.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.41.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.42.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.42.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.42.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.43.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.43.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.43.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.44.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.44.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.44.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.45.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.45.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.45.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.46.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.46.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.46.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.47.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.47.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.47.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.48.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.48.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.48.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.49.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.49.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.49.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.5.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.5.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.5.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.50.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.50.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.50.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.51.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.51.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.51.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.52.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.52.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.52.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.53.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.53.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.53.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.54.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.54.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.54.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.55.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.55.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.55.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.56.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.56.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.56.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.57.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.57.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.57.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.58.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.58.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.58.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.59.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.59.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.59.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.6.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.6.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.6.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.60.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.60.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.60.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.61.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.61.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.61.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.62.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.62.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.62.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.63.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.63.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.63.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.64.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.64.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.64.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.65.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.65.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.65.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.66.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.66.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.66.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.67.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.67.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.67.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.68.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.68.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.68.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.69.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.69.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.69.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.7.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.7.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.70.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.70.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.70.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.71.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.71.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.71.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.72.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.72.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.72.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.73.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.73.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.73.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.74.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.74.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.74.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.75.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.75.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.75.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.76.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.76.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.76.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.77.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.77.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.77.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.78.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.78.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.78.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.79.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.79.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.79.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.8.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.8.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.8.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.80.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.80.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.80.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.81.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.81.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.81.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.82.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.82.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.82.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.83.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.83.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.83.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.84.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.84.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.84.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.85.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.85.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.85.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.86.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.86.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.86.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.87.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.87.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.87.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.88.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.88.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.88.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.89.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.89.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.89.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.9.down_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.9.gate_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.9.up_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.mlp.experts.90.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.90.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.90.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.91.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.91.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.91.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.92.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.92.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.92.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.93.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.93.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.93.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.94.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.94.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.94.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.95.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.95.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.95.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.96.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.96.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.96.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.97.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.97.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.97.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.98.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.98.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.98.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.99.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.99.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.experts.99.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.gate.e_score_correction_bias": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.gate.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.shared_experts.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.shared_experts.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.mlp.shared_experts.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00015-of-00142.safetensors", + "model.layers.11.self_attn.k_norm.weight": "model-00014-of-00142.safetensors", + "model.layers.11.self_attn.k_proj.bias": "model-00014-of-00142.safetensors", + "model.layers.11.self_attn.k_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.self_attn.q_norm.weight": "model-00014-of-00142.safetensors", + "model.layers.11.self_attn.q_proj.bias": "model-00014-of-00142.safetensors", + "model.layers.11.self_attn.q_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.11.self_attn.v_proj.bias": "model-00014-of-00142.safetensors", + "model.layers.11.self_attn.v_proj.weight": "model-00014-of-00142.safetensors", + "model.layers.12.input_layernorm.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.0.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.mlp.experts.0.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.mlp.experts.0.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.mlp.experts.1.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.mlp.experts.1.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.mlp.experts.1.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.mlp.experts.10.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.10.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.10.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.100.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.100.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.100.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.101.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.101.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.101.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.102.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.102.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.102.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.103.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.103.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.103.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.104.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.104.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.104.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.105.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.105.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.105.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.106.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.106.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.106.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.107.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.107.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.107.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.108.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.108.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.108.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.109.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.109.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.109.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.11.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.11.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.11.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.110.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.110.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.110.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.111.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.111.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.111.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.112.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.112.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.112.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.113.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.113.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.113.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.114.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.114.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.114.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.115.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.115.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.115.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.116.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.116.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.116.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.117.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.117.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.117.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.118.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.118.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.118.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.119.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.119.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.119.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.12.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.12.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.12.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.120.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.120.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.120.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.121.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.121.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.121.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.122.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.122.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.122.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.123.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.123.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.123.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.124.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.124.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.124.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.125.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.125.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.125.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.126.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.126.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.126.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.127.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.127.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.127.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.128.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.128.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.128.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.129.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.129.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.129.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.13.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.13.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.13.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.130.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.130.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.130.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.131.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.131.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.131.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.132.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.132.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.132.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.133.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.133.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.133.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.134.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.134.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.134.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.135.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.135.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.135.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.136.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.136.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.136.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.137.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.137.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.137.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.138.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.138.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.138.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.139.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.139.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.139.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.14.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.14.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.14.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.140.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.140.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.140.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.141.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.141.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.141.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.142.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.142.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.142.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.143.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.143.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.143.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.144.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.144.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.144.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.145.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.145.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.145.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.146.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.146.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.146.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.147.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.147.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.147.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.148.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.148.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.148.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.149.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.149.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.149.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.15.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.15.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.15.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.150.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.150.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.150.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.151.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.151.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.151.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.152.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.152.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.152.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.153.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.153.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.153.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.154.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.154.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.154.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.155.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.155.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.155.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.156.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.156.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.156.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.157.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.157.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.157.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.158.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.158.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.158.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.159.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.159.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.159.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.experts.16.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.16.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.16.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.17.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.17.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.17.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.18.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.18.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.18.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.19.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.19.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.19.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.2.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.mlp.experts.2.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.mlp.experts.2.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.mlp.experts.20.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.20.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.20.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.21.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.21.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.21.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.22.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.22.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.22.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.23.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.23.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.23.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.24.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.24.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.24.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.25.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.25.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.25.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.26.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.26.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.26.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.27.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.27.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.27.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.28.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.28.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.28.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.29.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.29.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.29.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.3.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.mlp.experts.3.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.mlp.experts.3.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.mlp.experts.30.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.30.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.30.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.31.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.31.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.31.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.32.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.32.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.32.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.33.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.33.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.33.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.34.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.34.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.34.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.35.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.35.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.35.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.36.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.36.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.36.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.37.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.37.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.37.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.38.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.38.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.38.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.39.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.39.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.39.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.4.down_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.mlp.experts.4.gate_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.mlp.experts.4.up_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.mlp.experts.40.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.40.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.40.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.41.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.41.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.41.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.42.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.42.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.42.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.43.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.43.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.43.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.44.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.44.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.44.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.45.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.45.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.45.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.46.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.46.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.46.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.47.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.47.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.47.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.48.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.48.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.48.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.49.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.49.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.49.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.5.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.5.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.5.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.50.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.50.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.50.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.51.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.51.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.51.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.52.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.52.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.52.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.53.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.53.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.53.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.54.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.54.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.54.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.55.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.55.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.55.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.56.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.56.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.56.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.57.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.57.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.57.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.58.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.58.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.58.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.59.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.59.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.59.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.6.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.6.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.6.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.60.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.60.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.60.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.61.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.61.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.61.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.62.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.62.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.62.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.63.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.63.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.63.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.64.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.64.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.64.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.65.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.65.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.65.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.66.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.66.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.66.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.67.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.67.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.67.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.68.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.68.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.68.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.69.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.69.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.69.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.7.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.7.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.7.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.70.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.70.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.70.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.71.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.71.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.71.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.72.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.72.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.72.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.73.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.73.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.73.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.74.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.74.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.74.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.75.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.75.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.75.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.76.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.76.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.76.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.77.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.77.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.77.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.78.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.78.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.78.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.79.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.79.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.79.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.8.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.8.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.8.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.80.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.80.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.80.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.81.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.81.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.81.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.82.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.82.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.82.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.83.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.83.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.83.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.84.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.84.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.84.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.85.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.85.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.85.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.86.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.86.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.86.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.87.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.87.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.87.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.88.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.88.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.88.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.89.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.89.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.89.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.9.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.9.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.9.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.90.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.90.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.90.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.91.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.91.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.91.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.92.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.92.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.92.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.93.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.93.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.93.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.94.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.94.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.94.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.95.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.95.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.95.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.96.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.96.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.96.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.97.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.97.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.97.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.98.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.98.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.98.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.99.down_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.99.gate_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.experts.99.up_proj.weight": "model-00016-of-00142.safetensors", + "model.layers.12.mlp.gate.e_score_correction_bias": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.gate.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.shared_experts.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.shared_experts.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.mlp.shared_experts.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00017-of-00142.safetensors", + "model.layers.12.self_attn.k_norm.weight": "model-00015-of-00142.safetensors", + "model.layers.12.self_attn.k_proj.bias": "model-00015-of-00142.safetensors", + "model.layers.12.self_attn.k_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.self_attn.q_norm.weight": "model-00015-of-00142.safetensors", + "model.layers.12.self_attn.q_proj.bias": "model-00015-of-00142.safetensors", + "model.layers.12.self_attn.q_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.12.self_attn.v_proj.bias": "model-00015-of-00142.safetensors", + "model.layers.12.self_attn.v_proj.weight": "model-00015-of-00142.safetensors", + "model.layers.13.input_layernorm.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.experts.0.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.0.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.0.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.1.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.1.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.1.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.10.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.10.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.10.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.100.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.100.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.100.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.101.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.101.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.101.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.102.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.102.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.102.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.103.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.103.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.103.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.104.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.104.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.104.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.105.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.105.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.105.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.106.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.106.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.106.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.107.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.107.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.107.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.108.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.108.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.108.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.109.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.109.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.109.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.11.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.11.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.11.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.110.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.110.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.110.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.111.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.111.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.111.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.112.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.112.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.112.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.113.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.113.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.113.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.114.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.114.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.114.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.115.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.115.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.115.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.116.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.116.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.116.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.117.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.117.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.117.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.118.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.118.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.118.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.119.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.119.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.119.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.12.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.12.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.12.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.120.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.120.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.120.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.121.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.121.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.121.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.122.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.122.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.122.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.123.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.123.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.123.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.124.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.124.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.124.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.125.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.125.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.125.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.126.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.126.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.126.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.127.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.127.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.127.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.128.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.128.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.128.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.129.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.129.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.129.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.13.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.13.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.13.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.130.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.130.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.130.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.131.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.131.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.131.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.132.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.132.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.132.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.133.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.133.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.133.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.134.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.134.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.134.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.135.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.135.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.135.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.136.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.136.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.136.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.137.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.137.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.137.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.138.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.138.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.138.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.139.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.139.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.139.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.14.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.14.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.14.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.140.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.140.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.140.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.141.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.141.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.141.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.142.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.142.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.142.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.143.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.143.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.143.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.144.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.144.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.144.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.145.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.145.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.145.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.146.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.146.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.146.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.147.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.147.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.147.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.148.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.148.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.148.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.149.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.149.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.149.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.15.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.15.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.15.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.150.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.150.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.150.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.151.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.151.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.151.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.152.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.152.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.152.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.153.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.153.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.153.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.154.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.154.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.154.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.155.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.experts.155.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.155.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.experts.156.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.experts.156.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.experts.156.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.experts.157.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.experts.157.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.experts.157.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.experts.158.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.experts.158.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.experts.158.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.experts.159.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.experts.159.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.experts.159.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.experts.16.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.16.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.16.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.17.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.17.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.17.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.18.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.18.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.18.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.19.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.19.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.19.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.2.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.2.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.2.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.20.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.20.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.20.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.21.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.21.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.21.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.22.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.22.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.22.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.23.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.23.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.23.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.24.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.24.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.24.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.25.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.25.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.25.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.26.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.26.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.26.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.27.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.27.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.27.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.28.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.28.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.28.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.29.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.29.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.29.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.3.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.3.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.3.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.30.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.30.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.30.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.31.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.31.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.31.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.32.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.32.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.32.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.33.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.33.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.33.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.34.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.34.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.34.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.35.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.35.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.35.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.36.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.36.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.36.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.37.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.37.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.37.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.38.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.38.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.38.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.39.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.39.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.39.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.4.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.4.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.4.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.40.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.40.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.40.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.41.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.41.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.41.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.42.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.42.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.42.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.43.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.43.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.43.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.44.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.44.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.44.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.45.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.45.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.45.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.46.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.46.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.46.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.47.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.47.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.47.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.48.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.48.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.48.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.49.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.49.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.49.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.5.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.5.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.5.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.50.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.50.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.50.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.51.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.51.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.51.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.52.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.52.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.52.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.53.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.53.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.53.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.54.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.54.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.54.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.55.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.55.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.55.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.56.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.56.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.56.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.57.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.57.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.57.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.58.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.58.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.58.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.59.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.59.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.59.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.6.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.6.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.6.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.60.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.60.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.60.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.61.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.61.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.61.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.62.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.62.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.62.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.63.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.63.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.63.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.64.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.64.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.64.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.65.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.65.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.65.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.66.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.66.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.66.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.67.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.67.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.67.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.68.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.68.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.68.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.69.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.69.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.69.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.7.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.7.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.70.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.70.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.70.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.71.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.71.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.71.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.72.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.72.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.72.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.73.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.73.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.73.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.74.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.74.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.74.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.75.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.75.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.75.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.76.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.76.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.76.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.77.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.77.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.77.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.78.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.78.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.78.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.79.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.79.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.79.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.8.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.8.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.8.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.80.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.80.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.80.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.81.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.81.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.81.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.82.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.82.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.82.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.83.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.83.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.83.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.84.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.84.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.84.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.85.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.85.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.85.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.86.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.86.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.86.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.87.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.87.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.87.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.88.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.88.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.88.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.89.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.89.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.89.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.9.down_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.9.gate_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.9.up_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.mlp.experts.90.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.90.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.90.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.91.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.91.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.91.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.92.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.92.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.92.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.93.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.93.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.93.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.94.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.94.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.94.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.95.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.95.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.95.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.96.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.96.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.96.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.97.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.97.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.97.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.98.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.98.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.98.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.99.down_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.99.gate_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.experts.99.up_proj.weight": "model-00018-of-00142.safetensors", + "model.layers.13.mlp.gate.e_score_correction_bias": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.gate.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.shared_experts.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.shared_experts.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.mlp.shared_experts.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00019-of-00142.safetensors", + "model.layers.13.self_attn.k_norm.weight": "model-00017-of-00142.safetensors", + "model.layers.13.self_attn.k_proj.bias": "model-00017-of-00142.safetensors", + "model.layers.13.self_attn.k_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.self_attn.q_norm.weight": "model-00017-of-00142.safetensors", + "model.layers.13.self_attn.q_proj.bias": "model-00017-of-00142.safetensors", + "model.layers.13.self_attn.q_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.13.self_attn.v_proj.bias": "model-00017-of-00142.safetensors", + "model.layers.13.self_attn.v_proj.weight": "model-00017-of-00142.safetensors", + "model.layers.14.input_layernorm.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.0.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.0.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.0.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.1.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.1.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.1.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.10.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.10.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.10.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.100.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.100.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.100.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.101.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.101.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.101.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.102.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.102.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.102.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.103.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.103.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.103.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.104.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.104.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.104.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.105.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.105.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.105.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.106.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.106.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.106.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.107.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.107.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.107.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.108.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.108.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.108.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.109.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.109.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.109.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.11.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.11.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.11.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.110.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.110.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.110.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.111.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.111.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.111.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.112.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.112.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.112.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.113.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.113.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.113.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.114.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.114.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.114.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.115.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.115.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.115.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.116.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.116.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.116.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.117.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.117.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.117.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.118.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.118.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.118.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.119.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.119.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.119.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.12.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.12.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.12.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.120.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.120.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.120.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.121.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.121.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.121.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.122.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.122.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.122.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.123.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.123.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.123.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.124.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.124.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.124.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.125.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.125.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.125.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.126.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.126.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.126.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.127.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.127.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.127.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.128.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.128.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.128.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.129.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.129.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.129.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.13.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.13.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.13.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.130.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.130.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.130.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.131.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.131.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.131.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.132.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.132.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.132.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.133.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.133.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.133.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.134.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.134.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.134.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.135.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.135.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.135.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.136.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.136.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.136.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.137.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.137.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.137.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.138.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.138.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.138.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.139.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.139.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.139.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.14.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.14.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.14.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.140.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.140.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.140.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.141.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.141.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.141.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.142.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.142.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.142.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.143.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.143.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.143.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.144.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.144.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.144.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.145.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.145.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.145.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.146.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.146.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.146.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.147.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.147.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.147.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.148.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.148.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.148.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.149.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.149.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.149.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.15.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.15.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.15.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.150.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.150.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.150.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.151.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.151.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.151.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.152.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.152.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.152.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.153.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.153.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.153.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.154.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.154.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.154.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.155.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.155.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.155.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.156.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.156.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.156.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.157.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.157.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.157.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.158.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.158.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.158.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.159.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.159.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.159.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.16.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.16.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.16.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.17.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.17.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.17.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.18.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.18.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.18.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.19.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.19.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.19.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.2.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.2.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.2.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.20.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.20.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.20.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.21.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.21.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.21.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.22.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.22.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.22.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.23.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.23.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.23.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.24.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.24.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.24.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.25.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.25.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.25.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.26.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.26.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.26.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.27.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.27.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.27.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.28.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.28.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.28.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.29.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.29.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.29.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.3.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.3.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.3.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.30.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.30.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.30.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.31.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.31.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.31.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.32.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.32.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.32.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.33.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.33.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.33.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.34.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.34.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.34.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.35.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.35.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.35.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.36.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.36.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.36.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.37.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.37.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.37.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.38.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.38.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.38.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.39.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.39.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.39.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.4.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.4.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.4.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.40.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.40.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.40.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.41.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.41.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.41.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.42.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.42.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.42.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.43.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.43.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.43.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.44.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.44.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.44.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.45.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.45.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.45.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.46.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.46.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.46.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.47.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.47.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.47.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.48.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.48.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.48.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.49.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.49.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.49.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.5.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.5.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.5.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.50.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.50.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.50.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.51.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.51.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.51.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.52.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.52.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.52.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.53.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.53.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.53.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.54.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.54.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.54.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.55.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.55.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.55.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.56.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.56.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.56.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.57.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.57.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.57.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.58.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.58.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.58.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.59.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.59.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.59.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.6.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.6.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.6.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.60.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.60.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.60.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.61.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.61.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.61.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.62.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.62.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.62.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.63.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.63.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.63.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.64.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.64.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.64.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.65.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.65.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.65.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.66.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.66.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.66.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.67.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.67.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.67.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.68.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.68.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.68.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.69.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.69.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.69.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.7.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.7.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.7.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.70.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.70.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.70.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.71.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.71.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.71.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.72.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.72.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.72.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.73.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.73.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.73.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.74.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.74.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.74.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.75.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.75.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.75.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.76.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.76.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.76.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.77.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.77.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.77.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.78.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.78.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.78.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.79.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.79.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.79.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.8.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.8.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.8.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.80.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.80.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.80.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.81.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.81.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.81.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.82.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.82.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.82.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.83.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.83.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.83.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.84.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.84.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.84.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.85.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.85.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.85.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.86.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.86.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.86.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.87.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.87.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.87.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.88.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.88.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.88.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.89.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.89.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.89.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.9.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.9.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.9.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.90.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.90.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.90.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.91.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.91.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.91.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.92.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.92.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.92.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.93.down_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.93.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.93.up_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.94.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.94.gate_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.mlp.experts.94.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.95.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.95.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.95.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.96.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.96.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.96.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.97.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.97.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.97.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.98.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.98.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.98.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.99.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.99.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.experts.99.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.gate.e_score_correction_bias": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.gate.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.shared_experts.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.shared_experts.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.mlp.shared_experts.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00020-of-00142.safetensors", + "model.layers.14.self_attn.k_norm.weight": "model-00019-of-00142.safetensors", + "model.layers.14.self_attn.k_proj.bias": "model-00019-of-00142.safetensors", + "model.layers.14.self_attn.k_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.self_attn.q_norm.weight": "model-00019-of-00142.safetensors", + "model.layers.14.self_attn.q_proj.bias": "model-00019-of-00142.safetensors", + "model.layers.14.self_attn.q_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.14.self_attn.v_proj.bias": "model-00019-of-00142.safetensors", + "model.layers.14.self_attn.v_proj.weight": "model-00019-of-00142.safetensors", + "model.layers.15.input_layernorm.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.0.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.0.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.0.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.1.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.1.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.1.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.10.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.10.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.10.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.100.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.100.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.100.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.101.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.101.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.101.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.102.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.102.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.102.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.103.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.103.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.103.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.104.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.104.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.104.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.105.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.105.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.105.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.106.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.106.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.106.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.107.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.107.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.107.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.108.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.108.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.108.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.109.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.109.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.109.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.11.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.11.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.11.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.110.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.110.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.110.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.111.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.111.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.111.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.112.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.112.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.112.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.113.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.113.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.113.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.114.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.114.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.114.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.115.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.115.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.115.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.116.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.116.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.116.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.117.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.117.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.117.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.118.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.118.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.118.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.119.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.119.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.119.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.12.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.12.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.12.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.120.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.120.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.120.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.121.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.121.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.121.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.122.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.122.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.122.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.123.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.123.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.123.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.124.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.124.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.124.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.125.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.125.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.125.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.126.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.126.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.126.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.127.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.127.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.127.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.128.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.128.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.128.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.129.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.129.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.129.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.13.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.13.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.13.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.130.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.130.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.130.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.131.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.131.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.131.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.132.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.132.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.132.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.133.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.133.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.133.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.134.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.134.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.134.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.135.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.135.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.135.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.136.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.136.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.136.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.137.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.137.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.137.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.138.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.138.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.138.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.139.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.139.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.139.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.14.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.14.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.14.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.140.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.140.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.140.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.141.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.141.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.141.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.142.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.142.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.142.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.143.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.143.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.143.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.144.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.144.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.144.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.145.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.145.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.145.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.146.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.146.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.146.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.147.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.147.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.147.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.148.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.148.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.148.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.149.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.149.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.149.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.15.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.15.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.15.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.150.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.150.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.150.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.151.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.151.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.151.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.152.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.152.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.152.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.153.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.153.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.153.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.154.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.154.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.154.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.155.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.155.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.155.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.156.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.156.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.156.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.157.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.157.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.157.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.158.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.158.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.158.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.159.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.159.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.159.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.experts.16.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.16.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.16.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.17.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.17.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.17.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.18.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.18.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.18.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.19.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.19.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.19.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.2.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.2.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.2.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.20.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.20.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.20.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.21.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.21.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.21.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.22.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.22.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.22.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.23.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.23.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.23.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.24.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.24.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.24.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.25.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.25.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.25.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.26.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.26.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.26.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.27.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.27.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.27.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.28.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.28.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.28.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.29.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.29.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.29.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.3.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.3.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.3.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.30.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.30.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.30.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.31.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.31.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.31.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.32.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.32.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.32.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.33.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.33.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.33.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.34.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.34.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.34.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.35.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.35.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.35.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.36.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.36.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.36.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.37.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.37.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.37.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.38.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.38.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.38.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.39.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.39.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.39.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.4.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.4.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.4.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.40.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.40.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.40.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.41.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.41.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.41.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.42.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.42.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.42.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.43.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.43.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.43.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.44.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.44.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.44.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.45.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.45.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.45.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.46.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.46.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.46.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.47.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.47.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.47.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.48.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.48.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.48.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.49.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.49.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.49.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.5.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.5.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.5.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.50.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.50.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.50.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.51.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.51.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.51.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.52.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.52.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.52.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.53.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.53.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.53.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.54.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.54.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.54.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.55.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.55.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.55.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.56.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.56.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.56.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.57.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.57.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.57.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.58.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.58.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.58.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.59.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.59.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.59.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.6.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.6.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.6.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.60.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.60.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.60.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.61.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.61.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.61.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.62.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.62.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.62.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.63.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.63.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.63.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.64.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.64.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.64.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.65.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.65.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.65.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.66.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.66.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.66.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.67.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.67.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.67.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.68.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.68.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.68.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.69.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.69.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.69.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.7.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.7.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.70.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.70.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.70.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.71.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.71.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.71.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.72.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.72.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.72.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.73.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.73.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.73.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.74.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.74.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.74.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.75.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.75.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.75.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.76.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.76.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.76.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.77.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.77.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.77.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.78.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.78.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.78.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.79.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.79.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.79.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.8.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.8.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.8.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.80.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.80.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.80.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.81.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.81.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.81.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.82.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.82.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.82.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.83.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.83.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.83.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.84.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.84.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.84.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.85.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.85.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.85.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.86.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.86.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.86.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.87.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.87.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.87.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.88.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.88.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.88.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.89.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.89.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.89.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.9.down_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.9.gate_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.9.up_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.mlp.experts.90.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.90.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.90.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.91.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.91.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.91.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.92.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.92.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.92.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.93.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.93.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.93.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.94.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.94.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.94.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.95.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.95.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.95.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.96.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.96.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.96.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.97.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.97.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.97.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.98.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.98.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.98.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.99.down_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.99.gate_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.experts.99.up_proj.weight": "model-00021-of-00142.safetensors", + "model.layers.15.mlp.gate.e_score_correction_bias": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.gate.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.shared_experts.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.shared_experts.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.mlp.shared_experts.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00022-of-00142.safetensors", + "model.layers.15.self_attn.k_norm.weight": "model-00020-of-00142.safetensors", + "model.layers.15.self_attn.k_proj.bias": "model-00020-of-00142.safetensors", + "model.layers.15.self_attn.k_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.self_attn.q_norm.weight": "model-00020-of-00142.safetensors", + "model.layers.15.self_attn.q_proj.bias": "model-00020-of-00142.safetensors", + "model.layers.15.self_attn.q_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.15.self_attn.v_proj.bias": "model-00020-of-00142.safetensors", + "model.layers.15.self_attn.v_proj.weight": "model-00020-of-00142.safetensors", + "model.layers.16.input_layernorm.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.0.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.0.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.0.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.1.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.1.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.1.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.10.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.10.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.10.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.100.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.100.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.100.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.101.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.101.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.101.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.102.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.102.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.102.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.103.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.103.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.103.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.104.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.104.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.104.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.105.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.105.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.105.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.106.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.106.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.106.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.107.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.107.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.107.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.108.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.108.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.108.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.109.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.109.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.109.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.11.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.11.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.11.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.110.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.110.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.110.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.111.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.111.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.111.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.112.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.112.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.112.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.113.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.113.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.113.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.114.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.114.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.114.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.115.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.115.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.115.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.116.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.116.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.116.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.117.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.117.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.117.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.118.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.118.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.118.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.119.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.119.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.119.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.12.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.12.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.12.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.120.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.120.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.120.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.121.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.121.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.121.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.122.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.122.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.122.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.123.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.123.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.123.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.124.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.124.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.124.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.125.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.125.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.125.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.126.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.126.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.126.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.127.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.127.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.127.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.128.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.128.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.128.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.129.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.129.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.129.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.13.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.13.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.13.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.130.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.130.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.130.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.131.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.131.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.131.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.132.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.132.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.132.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.133.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.133.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.133.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.134.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.134.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.134.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.135.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.135.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.135.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.136.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.136.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.136.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.137.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.137.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.137.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.138.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.138.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.138.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.139.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.139.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.139.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.14.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.14.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.14.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.140.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.140.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.140.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.141.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.141.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.141.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.142.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.142.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.142.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.143.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.143.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.143.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.144.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.144.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.144.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.145.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.145.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.145.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.146.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.146.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.146.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.147.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.147.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.147.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.148.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.148.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.148.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.149.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.149.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.149.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.15.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.15.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.15.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.150.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.150.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.150.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.151.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.151.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.151.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.152.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.152.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.152.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.153.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.153.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.153.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.154.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.154.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.154.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.155.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.155.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.155.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.156.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.156.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.156.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.157.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.157.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.157.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.158.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.158.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.158.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.159.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.159.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.159.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.16.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.16.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.16.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.17.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.17.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.17.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.18.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.18.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.18.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.19.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.19.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.19.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.2.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.2.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.2.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.20.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.20.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.20.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.21.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.21.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.21.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.22.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.22.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.22.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.23.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.23.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.23.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.24.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.24.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.24.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.25.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.25.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.25.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.26.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.26.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.26.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.27.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.27.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.27.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.28.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.28.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.28.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.29.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.29.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.29.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.3.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.3.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.3.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.30.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.30.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.30.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.31.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.31.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.31.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.32.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.32.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.32.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.33.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.33.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.33.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.34.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.34.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.34.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.35.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.35.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.35.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.36.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.36.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.36.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.37.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.37.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.37.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.38.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.38.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.38.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.39.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.39.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.39.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.4.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.4.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.4.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.40.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.40.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.40.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.41.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.41.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.41.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.42.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.42.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.42.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.43.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.43.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.43.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.44.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.44.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.44.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.45.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.45.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.45.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.46.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.46.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.46.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.47.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.47.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.47.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.48.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.48.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.48.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.49.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.49.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.49.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.5.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.5.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.5.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.50.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.50.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.50.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.51.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.51.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.51.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.52.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.52.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.52.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.53.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.53.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.53.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.54.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.54.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.54.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.55.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.55.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.55.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.56.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.56.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.56.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.57.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.57.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.57.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.58.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.58.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.58.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.59.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.59.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.59.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.6.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.6.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.6.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.60.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.60.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.60.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.61.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.61.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.61.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.62.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.62.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.62.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.63.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.63.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.63.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.64.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.64.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.64.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.65.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.65.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.65.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.66.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.66.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.66.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.67.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.67.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.67.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.68.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.68.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.68.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.69.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.69.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.69.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.7.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.7.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.7.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.70.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.70.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.70.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.71.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.71.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.71.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.72.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.72.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.72.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.73.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.73.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.73.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.74.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.74.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.74.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.75.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.75.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.75.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.76.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.76.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.76.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.77.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.77.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.77.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.78.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.78.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.78.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.79.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.79.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.79.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.8.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.8.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.8.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.80.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.80.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.80.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.81.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.81.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.81.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.82.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.82.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.82.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.83.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.83.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.83.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.84.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.84.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.84.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.85.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.85.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.85.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.86.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.86.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.86.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.87.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.87.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.87.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.88.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.88.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.88.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.89.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.89.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.89.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.9.down_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.9.gate_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.9.up_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.mlp.experts.90.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.90.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.90.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.91.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.91.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.91.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.92.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.92.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.92.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.93.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.93.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.93.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.94.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.94.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.94.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.95.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.95.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.95.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.96.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.96.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.96.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.97.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.97.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.97.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.98.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.98.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.98.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.99.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.99.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.experts.99.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.gate.e_score_correction_bias": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.gate.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.shared_experts.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.shared_experts.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.mlp.shared_experts.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00023-of-00142.safetensors", + "model.layers.16.self_attn.k_norm.weight": "model-00022-of-00142.safetensors", + "model.layers.16.self_attn.k_proj.bias": "model-00022-of-00142.safetensors", + "model.layers.16.self_attn.k_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.self_attn.q_norm.weight": "model-00022-of-00142.safetensors", + "model.layers.16.self_attn.q_proj.bias": "model-00022-of-00142.safetensors", + "model.layers.16.self_attn.q_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.16.self_attn.v_proj.bias": "model-00022-of-00142.safetensors", + "model.layers.16.self_attn.v_proj.weight": "model-00022-of-00142.safetensors", + "model.layers.17.input_layernorm.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.0.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.0.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.0.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.1.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.1.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.1.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.10.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.10.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.10.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.100.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.100.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.100.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.101.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.101.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.101.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.102.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.102.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.102.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.103.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.103.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.103.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.104.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.104.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.104.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.105.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.105.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.105.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.106.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.106.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.106.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.107.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.107.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.107.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.108.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.108.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.108.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.109.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.109.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.109.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.11.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.11.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.11.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.110.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.110.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.110.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.111.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.111.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.111.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.112.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.112.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.112.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.113.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.113.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.113.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.114.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.114.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.114.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.115.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.115.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.115.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.116.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.116.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.116.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.117.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.117.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.117.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.118.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.118.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.118.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.119.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.119.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.119.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.12.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.12.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.12.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.120.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.120.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.120.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.121.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.121.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.121.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.122.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.122.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.122.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.123.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.123.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.123.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.124.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.124.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.124.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.125.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.125.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.125.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.126.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.126.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.126.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.127.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.127.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.127.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.128.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.128.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.128.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.129.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.129.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.129.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.13.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.13.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.13.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.130.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.130.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.130.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.131.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.131.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.131.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.132.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.132.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.132.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.133.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.133.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.133.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.134.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.134.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.134.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.135.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.135.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.135.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.136.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.136.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.136.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.137.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.137.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.137.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.138.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.138.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.138.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.139.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.139.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.139.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.14.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.14.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.14.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.140.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.140.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.140.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.141.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.141.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.141.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.142.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.142.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.142.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.143.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.143.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.143.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.144.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.144.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.144.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.145.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.145.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.145.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.146.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.146.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.146.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.147.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.147.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.147.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.148.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.148.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.148.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.149.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.149.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.149.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.15.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.15.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.15.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.150.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.150.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.150.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.151.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.151.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.151.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.152.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.152.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.152.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.153.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.153.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.153.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.154.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.154.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.154.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.155.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.155.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.155.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.156.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.156.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.156.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.157.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.157.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.157.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.158.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.158.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.158.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.159.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.159.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.159.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.experts.16.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.16.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.16.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.17.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.17.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.17.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.18.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.18.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.18.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.19.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.19.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.19.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.2.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.2.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.2.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.20.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.20.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.20.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.21.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.21.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.21.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.22.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.22.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.22.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.23.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.23.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.23.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.24.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.24.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.24.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.25.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.25.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.25.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.26.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.26.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.26.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.27.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.27.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.27.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.28.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.28.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.28.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.29.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.29.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.29.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.3.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.3.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.3.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.30.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.30.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.30.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.31.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.31.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.31.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.32.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.32.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.32.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.33.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.33.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.33.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.34.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.34.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.34.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.35.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.35.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.35.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.36.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.36.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.36.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.37.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.37.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.37.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.38.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.38.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.38.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.39.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.39.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.39.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.4.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.4.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.4.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.40.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.40.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.40.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.41.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.41.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.41.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.42.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.42.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.42.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.43.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.43.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.43.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.44.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.44.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.44.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.45.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.45.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.45.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.46.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.46.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.46.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.47.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.47.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.47.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.48.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.48.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.48.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.49.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.49.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.49.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.5.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.5.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.5.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.50.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.50.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.50.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.51.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.51.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.51.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.52.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.52.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.52.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.53.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.53.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.53.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.54.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.54.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.54.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.55.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.55.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.55.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.56.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.56.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.56.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.57.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.57.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.57.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.58.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.58.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.58.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.59.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.59.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.59.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.6.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.6.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.6.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.60.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.60.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.60.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.61.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.61.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.61.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.62.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.62.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.62.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.63.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.63.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.63.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.64.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.64.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.64.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.65.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.65.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.65.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.66.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.66.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.66.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.67.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.67.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.67.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.68.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.68.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.68.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.69.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.69.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.69.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.7.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.7.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.70.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.70.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.70.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.71.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.71.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.71.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.72.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.72.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.72.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.73.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.73.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.73.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.74.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.74.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.74.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.75.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.75.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.75.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.76.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.76.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.76.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.77.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.77.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.77.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.78.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.78.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.78.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.79.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.79.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.79.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.8.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.8.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.8.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.80.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.80.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.80.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.81.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.81.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.81.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.82.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.82.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.82.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.83.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.83.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.83.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.84.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.84.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.84.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.85.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.85.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.85.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.86.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.86.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.86.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.87.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.87.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.87.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.88.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.88.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.88.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.89.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.89.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.89.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.9.down_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.9.gate_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.9.up_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.mlp.experts.90.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.90.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.90.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.91.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.91.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.91.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.92.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.92.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.92.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.93.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.93.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.93.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.94.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.94.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.94.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.95.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.95.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.95.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.96.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.96.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.96.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.97.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.97.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.97.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.98.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.98.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.98.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.99.down_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.99.gate_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.experts.99.up_proj.weight": "model-00024-of-00142.safetensors", + "model.layers.17.mlp.gate.e_score_correction_bias": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.gate.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.shared_experts.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.shared_experts.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.mlp.shared_experts.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00025-of-00142.safetensors", + "model.layers.17.self_attn.k_norm.weight": "model-00023-of-00142.safetensors", + "model.layers.17.self_attn.k_proj.bias": "model-00023-of-00142.safetensors", + "model.layers.17.self_attn.k_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.self_attn.q_norm.weight": "model-00023-of-00142.safetensors", + "model.layers.17.self_attn.q_proj.bias": "model-00023-of-00142.safetensors", + "model.layers.17.self_attn.q_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.17.self_attn.v_proj.bias": "model-00023-of-00142.safetensors", + "model.layers.17.self_attn.v_proj.weight": "model-00023-of-00142.safetensors", + "model.layers.18.input_layernorm.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.0.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.0.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.0.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.1.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.1.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.1.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.10.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.10.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.10.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.100.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.100.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.100.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.101.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.101.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.101.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.102.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.102.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.102.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.103.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.103.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.103.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.104.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.104.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.104.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.105.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.105.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.105.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.106.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.106.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.106.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.107.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.107.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.107.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.108.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.108.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.108.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.109.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.109.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.109.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.11.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.11.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.11.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.110.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.110.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.110.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.111.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.111.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.111.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.112.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.112.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.112.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.113.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.113.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.113.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.114.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.114.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.114.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.115.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.115.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.115.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.116.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.116.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.116.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.117.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.117.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.117.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.118.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.118.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.118.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.119.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.119.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.119.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.12.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.12.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.12.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.120.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.120.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.120.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.121.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.121.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.121.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.122.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.122.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.122.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.123.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.123.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.123.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.124.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.124.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.124.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.125.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.125.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.125.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.126.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.126.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.126.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.127.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.127.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.127.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.128.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.128.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.128.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.129.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.129.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.129.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.13.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.13.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.13.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.130.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.130.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.130.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.131.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.131.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.131.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.132.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.132.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.132.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.133.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.133.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.133.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.134.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.134.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.134.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.135.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.135.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.135.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.136.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.136.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.136.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.137.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.137.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.137.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.138.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.138.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.138.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.139.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.139.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.139.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.14.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.14.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.14.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.140.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.140.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.140.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.141.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.141.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.141.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.142.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.142.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.142.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.143.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.143.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.143.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.144.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.144.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.144.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.145.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.145.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.145.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.146.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.146.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.146.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.147.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.147.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.147.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.148.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.148.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.148.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.149.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.149.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.149.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.15.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.15.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.15.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.150.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.150.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.150.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.151.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.151.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.151.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.152.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.152.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.152.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.153.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.153.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.153.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.154.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.154.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.154.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.155.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.155.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.155.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.156.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.156.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.156.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.157.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.157.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.157.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.158.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.158.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.158.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.159.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.159.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.159.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.16.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.16.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.16.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.17.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.17.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.17.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.18.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.18.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.18.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.19.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.19.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.19.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.2.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.2.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.2.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.20.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.20.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.20.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.21.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.21.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.21.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.22.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.22.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.22.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.23.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.23.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.23.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.24.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.24.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.24.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.25.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.25.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.25.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.26.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.26.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.26.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.27.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.27.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.27.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.28.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.28.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.28.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.29.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.29.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.29.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.3.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.3.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.3.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.30.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.30.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.30.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.31.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.31.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.31.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.32.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.32.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.32.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.33.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.33.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.33.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.34.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.34.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.34.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.35.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.35.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.35.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.36.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.36.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.36.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.37.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.37.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.37.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.38.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.38.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.38.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.39.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.39.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.39.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.4.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.4.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.4.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.40.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.40.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.40.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.41.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.41.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.41.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.42.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.42.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.42.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.43.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.43.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.43.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.44.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.44.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.44.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.45.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.45.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.45.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.46.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.46.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.46.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.47.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.47.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.47.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.48.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.48.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.48.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.49.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.49.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.49.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.5.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.5.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.5.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.50.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.50.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.50.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.51.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.51.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.51.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.52.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.52.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.52.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.53.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.53.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.53.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.54.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.54.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.54.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.55.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.55.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.55.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.56.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.56.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.56.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.57.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.57.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.57.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.58.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.58.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.58.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.59.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.59.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.59.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.6.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.6.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.6.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.60.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.60.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.60.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.61.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.61.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.61.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.62.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.62.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.62.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.63.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.63.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.63.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.64.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.64.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.64.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.65.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.65.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.65.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.66.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.66.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.66.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.67.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.67.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.67.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.68.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.68.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.68.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.69.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.69.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.69.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.7.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.7.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.7.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.70.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.70.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.70.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.71.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.71.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.71.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.72.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.72.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.72.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.73.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.73.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.73.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.74.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.74.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.74.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.75.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.75.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.75.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.76.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.76.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.76.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.77.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.77.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.77.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.78.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.78.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.78.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.79.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.79.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.79.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.8.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.8.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.8.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.80.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.80.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.80.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.81.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.81.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.81.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.82.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.82.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.82.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.83.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.83.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.83.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.84.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.84.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.84.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.85.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.85.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.85.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.86.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.86.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.86.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.87.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.87.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.87.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.88.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.88.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.88.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.89.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.89.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.89.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.9.down_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.9.gate_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.9.up_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.mlp.experts.90.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.90.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.90.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.91.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.91.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.91.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.92.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.92.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.92.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.93.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.93.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.93.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.94.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.94.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.94.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.95.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.95.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.95.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.96.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.96.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.96.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.97.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.97.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.97.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.98.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.98.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.98.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.99.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.99.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.experts.99.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.gate.e_score_correction_bias": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.gate.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.shared_experts.down_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.shared_experts.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.mlp.shared_experts.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00026-of-00142.safetensors", + "model.layers.18.self_attn.k_norm.weight": "model-00025-of-00142.safetensors", + "model.layers.18.self_attn.k_proj.bias": "model-00025-of-00142.safetensors", + "model.layers.18.self_attn.k_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.self_attn.q_norm.weight": "model-00025-of-00142.safetensors", + "model.layers.18.self_attn.q_proj.bias": "model-00025-of-00142.safetensors", + "model.layers.18.self_attn.q_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.18.self_attn.v_proj.bias": "model-00025-of-00142.safetensors", + "model.layers.18.self_attn.v_proj.weight": "model-00025-of-00142.safetensors", + "model.layers.19.input_layernorm.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.0.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.0.gate_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.19.mlp.experts.0.up_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.19.mlp.experts.1.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.1.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.1.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.10.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.10.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.10.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.100.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.100.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.100.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.101.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.101.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.101.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.102.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.102.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.102.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.103.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.103.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.103.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.104.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.104.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.104.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.105.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.105.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.105.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.106.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.106.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.106.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.107.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.107.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.107.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.108.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.108.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.108.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.109.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.109.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.109.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.11.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.11.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.11.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.110.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.110.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.110.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.111.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.111.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.111.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.112.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.112.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.112.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.113.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.113.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.113.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.114.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.114.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.114.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.115.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.115.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.115.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.116.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.116.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.116.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.117.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.117.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.117.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.118.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.118.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.118.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.119.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.119.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.119.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.12.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.12.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.12.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.120.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.120.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.120.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.121.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.121.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.121.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.122.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.122.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.122.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.123.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.123.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.123.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.124.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.124.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.124.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.125.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.125.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.125.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.126.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.126.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.126.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.127.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.127.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.127.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.128.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.128.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.128.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.129.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.129.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.129.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.13.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.13.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.13.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.130.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.130.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.130.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.131.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.131.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.131.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.132.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.132.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.132.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.133.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.133.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.133.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.134.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.134.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.134.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.135.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.135.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.135.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.136.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.136.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.136.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.137.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.137.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.137.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.138.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.138.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.138.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.139.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.139.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.139.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.14.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.14.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.14.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.140.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.140.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.140.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.141.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.141.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.141.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.142.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.142.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.142.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.143.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.143.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.143.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.144.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.144.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.144.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.145.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.145.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.145.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.146.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.146.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.146.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.147.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.147.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.147.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.148.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.148.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.148.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.149.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.149.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.149.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.15.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.15.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.15.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.150.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.150.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.150.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.151.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.151.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.151.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.152.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.152.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.152.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.153.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.153.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.153.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.154.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.154.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.154.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.155.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.155.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.155.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.156.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.156.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.156.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.157.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.157.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.157.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.158.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.158.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.158.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.159.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.159.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.159.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.experts.16.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.16.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.16.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.17.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.17.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.17.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.18.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.18.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.18.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.19.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.19.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.19.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.2.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.2.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.2.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.20.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.20.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.20.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.21.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.21.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.21.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.22.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.22.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.22.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.23.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.23.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.23.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.24.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.24.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.24.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.25.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.25.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.25.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.26.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.26.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.26.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.27.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.27.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.27.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.28.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.28.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.28.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.29.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.29.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.29.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.3.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.3.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.3.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.30.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.30.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.30.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.31.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.31.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.31.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.32.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.32.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.32.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.33.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.33.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.33.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.34.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.34.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.34.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.35.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.35.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.35.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.36.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.36.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.36.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.37.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.37.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.37.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.38.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.38.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.38.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.39.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.39.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.39.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.4.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.4.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.4.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.40.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.40.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.40.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.41.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.41.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.41.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.42.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.42.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.42.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.43.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.43.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.43.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.44.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.44.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.44.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.45.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.45.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.45.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.46.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.46.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.46.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.47.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.47.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.47.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.48.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.48.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.48.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.49.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.49.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.49.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.5.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.5.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.5.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.50.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.50.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.50.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.51.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.51.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.51.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.52.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.52.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.52.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.53.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.53.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.53.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.54.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.54.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.54.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.55.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.55.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.55.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.56.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.56.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.56.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.57.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.57.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.57.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.58.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.58.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.58.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.59.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.59.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.59.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.6.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.6.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.6.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.60.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.60.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.60.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.61.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.61.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.61.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.62.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.62.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.62.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.63.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.63.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.63.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.64.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.64.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.64.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.65.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.65.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.65.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.66.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.66.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.66.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.67.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.67.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.67.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.68.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.68.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.68.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.69.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.69.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.69.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.7.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.7.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.70.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.70.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.70.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.71.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.71.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.71.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.72.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.72.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.72.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.73.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.73.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.73.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.74.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.74.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.74.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.75.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.75.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.75.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.76.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.76.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.76.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.77.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.77.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.77.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.78.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.78.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.78.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.79.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.79.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.79.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.8.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.8.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.8.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.80.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.80.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.80.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.81.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.81.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.81.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.82.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.82.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.82.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.83.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.83.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.83.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.84.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.84.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.84.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.85.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.85.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.85.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.86.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.86.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.86.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.87.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.87.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.87.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.88.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.88.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.88.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.89.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.89.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.89.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.9.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.9.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.9.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.90.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.90.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.90.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.91.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.91.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.91.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.92.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.92.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.92.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.93.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.93.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.93.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.94.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.94.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.94.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.95.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.95.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.95.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.96.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.96.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.96.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.97.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.97.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.97.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.98.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.98.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.98.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.99.down_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.99.gate_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.experts.99.up_proj.weight": "model-00027-of-00142.safetensors", + "model.layers.19.mlp.gate.e_score_correction_bias": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.gate.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.shared_experts.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.shared_experts.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.mlp.shared_experts.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00028-of-00142.safetensors", + "model.layers.19.self_attn.k_norm.weight": "model-00026-of-00142.safetensors", + "model.layers.19.self_attn.k_proj.bias": "model-00026-of-00142.safetensors", + "model.layers.19.self_attn.k_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.19.self_attn.q_norm.weight": "model-00026-of-00142.safetensors", + "model.layers.19.self_attn.q_proj.bias": "model-00026-of-00142.safetensors", + "model.layers.19.self_attn.q_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.19.self_attn.v_proj.bias": "model-00026-of-00142.safetensors", + "model.layers.19.self_attn.v_proj.weight": "model-00026-of-00142.safetensors", + "model.layers.2.input_layernorm.weight": "model-00001-of-00142.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00001-of-00142.safetensors", + "model.layers.2.self_attn.k_norm.weight": "model-00001-of-00142.safetensors", + "model.layers.2.self_attn.k_proj.bias": "model-00001-of-00142.safetensors", + "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.2.self_attn.q_norm.weight": "model-00001-of-00142.safetensors", + "model.layers.2.self_attn.q_proj.bias": "model-00001-of-00142.safetensors", + "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.2.self_attn.v_proj.bias": "model-00001-of-00142.safetensors", + "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.20.input_layernorm.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.0.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.0.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.0.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.1.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.1.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.1.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.10.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.10.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.10.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.100.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.100.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.100.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.101.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.101.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.101.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.102.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.102.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.102.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.103.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.103.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.103.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.104.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.104.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.104.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.105.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.105.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.105.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.106.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.106.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.106.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.107.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.107.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.107.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.108.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.108.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.108.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.109.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.109.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.109.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.11.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.11.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.11.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.110.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.110.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.110.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.111.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.111.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.111.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.112.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.112.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.112.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.113.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.113.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.113.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.114.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.114.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.114.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.115.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.115.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.115.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.116.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.116.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.116.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.117.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.117.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.117.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.118.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.118.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.118.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.119.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.119.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.119.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.12.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.12.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.12.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.120.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.120.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.120.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.121.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.121.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.121.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.122.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.122.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.122.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.123.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.123.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.123.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.124.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.124.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.124.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.125.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.125.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.125.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.126.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.126.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.126.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.127.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.127.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.127.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.128.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.128.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.128.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.129.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.129.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.129.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.13.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.13.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.13.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.130.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.130.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.130.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.131.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.131.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.131.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.132.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.132.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.132.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.133.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.133.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.133.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.134.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.134.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.134.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.135.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.135.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.135.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.136.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.136.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.136.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.137.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.137.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.137.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.138.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.138.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.138.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.139.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.139.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.139.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.14.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.14.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.14.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.140.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.140.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.140.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.141.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.141.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.141.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.142.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.142.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.142.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.143.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.143.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.143.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.144.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.144.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.144.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.145.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.145.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.145.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.146.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.146.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.146.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.147.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.147.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.147.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.148.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.148.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.148.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.149.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.149.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.149.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.15.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.15.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.15.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.150.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.150.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.150.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.151.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.151.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.151.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.152.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.152.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.152.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.153.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.153.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.153.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.154.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.154.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.154.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.155.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.155.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.155.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.156.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.156.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.156.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.157.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.157.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.157.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.158.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.158.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.158.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.159.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.159.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.159.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.experts.16.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.16.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.16.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.17.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.17.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.17.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.18.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.18.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.18.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.19.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.19.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.19.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.2.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.2.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.2.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.20.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.20.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.20.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.21.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.21.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.21.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.22.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.22.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.22.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.23.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.23.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.23.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.24.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.24.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.24.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.25.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.25.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.25.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.26.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.26.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.26.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.27.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.27.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.27.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.28.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.28.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.28.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.29.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.29.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.29.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.3.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.3.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.3.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.30.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.30.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.30.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.31.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.31.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.31.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.32.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.32.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.32.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.33.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.33.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.33.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.34.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.34.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.34.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.35.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.35.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.35.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.36.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.36.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.36.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.37.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.37.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.37.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.38.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.38.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.38.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.39.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.39.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.39.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.4.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.4.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.4.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.40.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.40.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.40.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.41.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.41.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.41.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.42.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.42.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.42.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.43.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.43.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.43.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.44.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.44.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.44.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.45.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.45.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.45.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.46.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.46.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.46.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.47.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.47.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.47.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.48.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.48.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.48.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.49.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.49.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.49.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.5.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.5.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.5.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.50.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.50.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.50.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.51.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.51.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.51.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.52.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.52.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.52.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.53.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.53.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.53.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.54.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.54.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.54.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.55.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.55.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.55.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.56.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.56.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.56.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.57.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.57.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.57.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.58.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.58.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.58.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.59.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.59.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.59.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.6.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.6.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.6.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.60.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.60.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.60.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.61.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.61.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.61.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.62.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.62.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.62.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.63.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.63.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.63.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.64.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.64.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.64.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.65.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.65.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.65.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.66.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.66.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.66.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.67.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.67.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.67.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.68.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.68.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.68.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.69.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.69.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.69.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.7.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.7.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.7.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.70.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.70.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.70.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.71.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.71.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.71.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.72.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.72.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.72.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.73.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.73.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.73.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.74.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.74.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.74.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.75.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.75.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.75.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.76.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.76.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.76.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.77.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.77.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.77.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.78.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.78.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.78.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.79.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.79.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.79.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.8.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.8.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.8.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.80.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.80.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.80.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.81.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.81.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.81.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.82.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.82.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.82.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.83.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.83.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.83.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.84.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.84.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.84.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.85.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.85.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.85.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.86.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.86.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.86.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.87.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.87.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.87.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.88.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.88.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.88.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.89.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.89.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.89.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.9.down_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.9.gate_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.9.up_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.mlp.experts.90.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.90.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.90.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.91.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.91.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.91.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.92.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.92.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.92.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.93.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.93.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.93.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.94.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.94.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.94.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.95.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.95.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.95.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.96.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.96.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.96.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.97.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.97.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.97.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.98.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.98.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.98.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.99.down_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.99.gate_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.experts.99.up_proj.weight": "model-00029-of-00142.safetensors", + "model.layers.20.mlp.gate.e_score_correction_bias": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.gate.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.shared_experts.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.shared_experts.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.mlp.shared_experts.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00030-of-00142.safetensors", + "model.layers.20.self_attn.k_norm.weight": "model-00028-of-00142.safetensors", + "model.layers.20.self_attn.k_proj.bias": "model-00028-of-00142.safetensors", + "model.layers.20.self_attn.k_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.self_attn.q_norm.weight": "model-00028-of-00142.safetensors", + "model.layers.20.self_attn.q_proj.bias": "model-00028-of-00142.safetensors", + "model.layers.20.self_attn.q_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.20.self_attn.v_proj.bias": "model-00028-of-00142.safetensors", + "model.layers.20.self_attn.v_proj.weight": "model-00028-of-00142.safetensors", + "model.layers.21.input_layernorm.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.0.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.0.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.0.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.1.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.1.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.1.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.10.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.10.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.10.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.100.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.100.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.100.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.101.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.101.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.101.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.102.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.102.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.102.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.103.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.103.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.103.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.104.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.104.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.104.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.105.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.105.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.105.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.106.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.106.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.106.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.107.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.107.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.107.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.108.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.108.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.108.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.109.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.109.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.109.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.11.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.11.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.11.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.110.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.110.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.110.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.111.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.111.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.111.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.112.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.112.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.112.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.113.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.113.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.113.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.114.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.114.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.114.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.115.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.115.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.115.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.116.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.116.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.116.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.117.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.117.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.117.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.118.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.118.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.118.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.119.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.119.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.119.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.12.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.12.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.12.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.120.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.120.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.120.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.121.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.121.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.121.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.122.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.122.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.122.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.123.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.123.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.123.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.124.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.124.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.124.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.125.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.125.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.125.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.126.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.126.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.126.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.127.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.127.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.127.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.128.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.128.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.128.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.129.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.129.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.129.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.13.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.13.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.13.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.130.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.130.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.130.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.131.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.131.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.131.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.132.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.132.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.132.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.133.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.133.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.133.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.134.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.134.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.134.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.135.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.135.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.135.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.136.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.136.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.136.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.137.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.137.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.137.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.138.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.138.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.138.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.139.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.139.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.139.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.14.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.14.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.14.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.140.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.140.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.140.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.141.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.141.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.141.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.142.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.142.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.142.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.143.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.143.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.143.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.144.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.144.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.144.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.145.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.145.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.145.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.146.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.146.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.146.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.147.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.147.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.147.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.148.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.148.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.148.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.149.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.149.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.149.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.15.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.15.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.15.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.150.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.150.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.150.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.151.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.151.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.151.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.152.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.152.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.152.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.153.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.153.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.153.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.154.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.154.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.154.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.155.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.155.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.155.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.156.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.156.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.156.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.157.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.157.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.157.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.158.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.158.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.158.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.159.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.159.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.159.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.16.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.16.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.16.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.17.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.17.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.17.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.18.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.18.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.18.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.19.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.19.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.19.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.2.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.2.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.2.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.20.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.20.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.20.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.21.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.21.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.21.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.22.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.22.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.22.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.23.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.23.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.23.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.24.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.24.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.24.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.25.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.25.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.25.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.26.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.26.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.26.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.27.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.27.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.27.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.28.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.28.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.28.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.29.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.29.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.29.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.3.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.3.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.3.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.30.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.30.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.30.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.31.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.31.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.31.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.32.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.32.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.32.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.33.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.33.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.33.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.34.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.34.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.34.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.35.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.35.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.35.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.36.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.36.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.36.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.37.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.37.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.37.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.38.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.38.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.38.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.39.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.39.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.39.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.4.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.4.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.4.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.40.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.40.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.40.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.41.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.41.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.41.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.42.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.42.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.42.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.43.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.43.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.43.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.44.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.44.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.44.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.45.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.45.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.45.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.46.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.46.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.46.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.47.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.47.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.47.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.48.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.48.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.48.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.49.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.49.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.49.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.5.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.5.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.5.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.50.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.50.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.50.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.51.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.51.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.51.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.52.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.52.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.52.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.53.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.53.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.53.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.54.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.54.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.54.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.55.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.55.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.55.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.56.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.56.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.56.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.57.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.57.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.57.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.58.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.58.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.58.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.59.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.59.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.59.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.6.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.6.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.6.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.60.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.60.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.60.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.61.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.61.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.61.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.62.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.62.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.62.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.63.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.63.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.63.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.64.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.64.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.64.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.65.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.65.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.65.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.66.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.66.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.66.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.67.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.67.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.67.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.68.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.68.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.68.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.69.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.69.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.69.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.7.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.7.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.70.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.70.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.70.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.71.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.71.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.71.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.72.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.72.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.72.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.73.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.73.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.73.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.74.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.74.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.74.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.75.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.75.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.75.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.76.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.76.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.76.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.77.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.77.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.77.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.78.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.78.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.78.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.79.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.79.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.79.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.8.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.8.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.8.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.80.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.80.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.80.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.81.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.81.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.81.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.82.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.82.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.82.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.83.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.83.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.83.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.84.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.84.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.84.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.85.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.85.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.85.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.86.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.86.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.86.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.87.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.87.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.87.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.88.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.88.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.88.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.89.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.89.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.89.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.9.down_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.9.gate_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.9.up_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.mlp.experts.90.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.90.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.90.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.91.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.91.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.91.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.92.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.92.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.92.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.93.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.93.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.93.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.94.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.94.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.94.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.95.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.95.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.95.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.96.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.96.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.96.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.97.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.97.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.97.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.98.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.98.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.98.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.99.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.99.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.experts.99.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.gate.e_score_correction_bias": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.gate.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.shared_experts.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.shared_experts.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.mlp.shared_experts.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00031-of-00142.safetensors", + "model.layers.21.self_attn.k_norm.weight": "model-00030-of-00142.safetensors", + "model.layers.21.self_attn.k_proj.bias": "model-00030-of-00142.safetensors", + "model.layers.21.self_attn.k_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.self_attn.q_norm.weight": "model-00030-of-00142.safetensors", + "model.layers.21.self_attn.q_proj.bias": "model-00030-of-00142.safetensors", + "model.layers.21.self_attn.q_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.21.self_attn.v_proj.bias": "model-00030-of-00142.safetensors", + "model.layers.21.self_attn.v_proj.weight": "model-00030-of-00142.safetensors", + "model.layers.22.input_layernorm.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.0.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.0.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.0.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.1.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.1.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.1.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.10.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.10.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.10.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.100.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.100.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.100.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.101.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.101.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.101.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.102.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.102.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.102.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.103.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.103.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.103.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.104.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.104.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.104.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.105.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.105.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.105.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.106.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.106.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.106.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.107.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.107.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.107.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.108.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.108.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.108.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.109.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.109.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.109.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.11.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.11.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.11.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.110.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.110.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.110.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.111.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.111.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.111.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.112.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.112.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.112.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.113.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.113.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.113.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.114.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.114.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.114.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.115.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.115.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.115.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.116.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.116.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.116.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.117.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.117.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.117.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.118.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.118.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.118.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.119.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.119.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.119.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.12.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.12.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.12.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.120.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.120.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.120.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.121.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.121.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.121.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.122.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.122.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.122.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.123.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.123.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.123.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.124.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.124.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.124.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.125.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.125.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.125.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.126.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.126.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.126.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.127.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.127.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.127.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.128.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.128.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.128.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.129.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.129.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.129.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.13.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.13.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.13.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.130.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.130.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.130.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.131.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.131.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.131.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.132.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.132.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.132.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.133.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.133.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.133.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.134.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.134.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.134.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.135.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.135.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.135.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.136.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.136.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.136.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.137.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.137.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.137.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.138.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.138.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.138.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.139.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.139.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.139.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.14.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.14.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.14.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.140.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.140.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.140.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.141.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.141.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.141.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.142.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.142.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.142.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.143.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.143.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.143.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.144.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.144.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.144.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.145.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.145.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.145.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.146.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.146.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.146.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.147.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.147.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.147.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.148.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.148.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.148.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.149.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.149.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.149.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.15.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.15.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.15.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.150.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.150.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.150.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.151.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.151.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.151.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.152.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.152.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.152.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.153.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.153.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.153.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.154.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.154.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.154.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.155.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.155.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.155.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.156.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.156.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.156.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.157.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.157.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.157.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.158.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.158.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.158.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.159.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.159.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.159.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.experts.16.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.16.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.16.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.17.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.17.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.17.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.18.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.18.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.18.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.19.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.19.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.19.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.2.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.2.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.2.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.20.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.20.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.20.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.21.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.21.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.21.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.22.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.22.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.22.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.23.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.23.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.23.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.24.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.24.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.24.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.25.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.25.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.25.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.26.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.26.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.26.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.27.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.27.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.27.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.28.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.28.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.28.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.29.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.29.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.29.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.3.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.3.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.3.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.30.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.30.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.30.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.31.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.31.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.31.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.32.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.32.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.32.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.33.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.33.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.33.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.34.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.34.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.34.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.35.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.35.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.35.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.36.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.36.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.36.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.37.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.37.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.37.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.38.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.38.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.38.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.39.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.39.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.39.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.4.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.4.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.4.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.40.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.40.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.40.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.41.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.41.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.41.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.42.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.42.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.42.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.43.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.43.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.43.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.44.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.44.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.44.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.45.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.45.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.45.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.46.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.46.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.46.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.47.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.47.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.47.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.48.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.48.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.48.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.49.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.49.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.49.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.5.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.5.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.5.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.50.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.50.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.50.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.51.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.51.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.51.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.52.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.52.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.52.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.53.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.53.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.53.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.54.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.54.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.54.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.55.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.55.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.55.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.56.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.56.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.56.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.57.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.57.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.57.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.58.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.58.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.58.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.59.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.59.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.59.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.6.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.6.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.6.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.60.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.60.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.60.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.61.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.61.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.61.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.62.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.62.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.62.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.63.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.63.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.63.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.64.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.64.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.64.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.65.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.65.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.65.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.66.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.66.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.66.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.67.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.67.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.67.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.68.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.68.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.68.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.69.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.69.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.69.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.7.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.7.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.7.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.70.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.70.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.70.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.71.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.71.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.71.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.72.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.72.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.72.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.73.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.73.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.73.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.74.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.74.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.74.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.75.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.75.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.75.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.76.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.76.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.76.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.77.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.77.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.77.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.78.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.78.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.78.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.79.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.79.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.79.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.8.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.8.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.8.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.80.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.80.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.80.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.81.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.81.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.81.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.82.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.82.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.82.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.83.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.83.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.83.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.84.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.84.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.84.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.85.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.85.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.85.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.86.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.86.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.86.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.87.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.87.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.87.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.88.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.88.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.88.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.89.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.89.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.89.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.9.down_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.9.gate_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.9.up_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.mlp.experts.90.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.90.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.90.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.91.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.91.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.91.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.92.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.92.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.92.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.93.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.93.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.93.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.94.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.94.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.94.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.95.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.95.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.95.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.96.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.96.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.96.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.97.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.97.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.97.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.98.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.98.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.98.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.99.down_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.99.gate_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.experts.99.up_proj.weight": "model-00032-of-00142.safetensors", + "model.layers.22.mlp.gate.e_score_correction_bias": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.gate.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.shared_experts.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.shared_experts.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.mlp.shared_experts.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00033-of-00142.safetensors", + "model.layers.22.self_attn.k_norm.weight": "model-00031-of-00142.safetensors", + "model.layers.22.self_attn.k_proj.bias": "model-00031-of-00142.safetensors", + "model.layers.22.self_attn.k_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.self_attn.q_norm.weight": "model-00031-of-00142.safetensors", + "model.layers.22.self_attn.q_proj.bias": "model-00031-of-00142.safetensors", + "model.layers.22.self_attn.q_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.22.self_attn.v_proj.bias": "model-00031-of-00142.safetensors", + "model.layers.22.self_attn.v_proj.weight": "model-00031-of-00142.safetensors", + "model.layers.23.input_layernorm.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.0.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.0.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.0.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.1.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.1.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.1.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.10.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.10.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.10.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.100.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.100.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.100.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.101.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.101.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.101.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.102.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.102.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.102.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.103.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.103.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.103.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.104.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.104.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.104.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.105.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.105.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.105.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.106.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.106.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.106.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.107.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.107.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.107.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.108.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.108.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.108.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.109.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.109.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.109.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.11.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.11.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.11.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.110.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.110.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.110.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.111.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.111.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.111.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.112.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.112.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.112.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.113.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.113.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.113.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.114.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.114.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.114.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.115.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.115.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.115.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.116.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.116.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.116.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.117.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.117.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.117.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.118.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.118.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.118.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.119.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.119.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.119.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.12.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.12.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.12.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.120.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.120.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.120.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.121.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.121.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.121.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.122.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.122.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.122.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.123.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.123.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.123.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.124.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.124.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.124.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.125.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.125.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.125.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.126.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.126.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.126.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.127.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.127.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.127.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.128.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.128.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.128.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.129.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.129.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.129.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.13.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.13.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.13.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.130.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.130.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.130.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.131.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.131.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.131.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.132.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.132.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.132.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.133.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.133.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.133.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.134.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.134.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.134.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.135.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.135.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.135.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.136.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.136.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.136.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.137.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.137.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.137.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.138.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.138.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.138.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.139.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.139.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.139.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.14.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.14.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.14.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.140.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.140.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.140.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.141.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.141.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.141.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.142.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.142.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.142.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.143.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.143.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.143.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.144.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.144.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.144.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.145.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.145.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.145.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.146.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.146.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.146.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.147.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.147.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.147.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.148.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.148.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.148.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.149.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.149.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.149.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.15.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.15.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.15.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.150.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.150.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.150.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.151.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.151.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.151.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.152.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.152.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.152.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.153.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.153.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.153.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.154.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.154.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.154.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.155.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.155.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.155.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.156.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.156.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.156.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.157.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.157.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.157.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.158.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.158.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.158.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.159.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.159.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.159.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.16.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.16.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.16.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.17.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.17.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.17.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.18.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.18.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.18.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.19.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.19.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.19.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.2.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.2.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.2.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.20.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.20.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.20.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.21.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.21.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.21.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.22.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.22.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.22.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.23.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.23.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.23.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.24.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.24.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.24.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.25.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.25.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.25.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.26.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.26.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.26.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.27.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.27.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.27.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.28.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.28.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.28.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.29.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.29.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.29.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.3.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.3.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.3.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.30.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.30.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.30.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.31.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.31.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.31.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.32.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.32.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.32.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.33.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.33.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.33.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.34.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.34.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.34.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.35.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.35.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.35.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.36.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.36.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.36.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.37.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.37.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.37.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.38.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.38.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.38.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.39.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.39.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.39.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.4.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.4.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.4.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.40.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.40.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.40.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.41.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.41.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.41.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.42.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.42.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.42.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.43.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.43.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.43.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.44.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.44.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.44.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.45.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.45.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.45.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.46.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.46.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.46.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.47.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.47.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.47.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.48.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.48.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.48.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.49.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.49.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.49.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.5.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.5.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.5.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.50.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.50.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.50.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.51.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.51.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.51.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.52.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.52.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.52.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.53.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.53.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.53.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.54.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.54.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.54.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.55.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.55.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.55.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.56.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.56.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.56.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.57.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.57.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.57.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.58.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.58.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.58.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.59.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.59.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.59.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.6.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.6.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.6.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.60.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.60.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.60.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.61.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.61.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.61.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.62.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.62.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.62.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.63.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.63.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.63.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.64.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.64.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.64.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.65.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.65.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.65.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.66.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.66.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.66.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.67.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.67.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.67.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.68.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.68.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.68.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.69.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.69.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.69.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.7.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.7.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.70.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.70.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.70.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.71.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.71.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.71.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.72.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.72.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.72.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.73.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.73.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.73.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.74.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.74.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.74.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.75.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.75.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.75.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.76.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.76.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.76.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.77.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.77.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.77.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.78.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.78.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.78.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.79.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.79.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.79.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.8.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.8.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.8.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.80.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.80.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.80.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.81.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.81.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.81.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.82.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.82.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.82.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.83.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.83.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.83.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.84.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.84.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.84.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.85.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.85.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.85.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.86.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.86.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.86.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.87.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.87.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.87.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.88.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.88.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.88.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.89.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.89.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.89.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.9.down_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.9.gate_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.9.up_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.mlp.experts.90.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.90.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.90.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.91.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.91.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.91.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.92.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.92.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.92.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.93.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.93.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.93.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.94.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.94.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.94.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.95.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.95.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.95.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.96.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.96.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.96.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.97.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.97.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.97.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.98.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.98.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.98.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.99.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.99.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.experts.99.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.gate.e_score_correction_bias": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.gate.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.shared_experts.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.shared_experts.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.mlp.shared_experts.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00034-of-00142.safetensors", + "model.layers.23.self_attn.k_norm.weight": "model-00033-of-00142.safetensors", + "model.layers.23.self_attn.k_proj.bias": "model-00033-of-00142.safetensors", + "model.layers.23.self_attn.k_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.self_attn.q_norm.weight": "model-00033-of-00142.safetensors", + "model.layers.23.self_attn.q_proj.bias": "model-00033-of-00142.safetensors", + "model.layers.23.self_attn.q_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.23.self_attn.v_proj.bias": "model-00033-of-00142.safetensors", + "model.layers.23.self_attn.v_proj.weight": "model-00033-of-00142.safetensors", + "model.layers.24.input_layernorm.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.0.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.0.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.0.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.1.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.1.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.1.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.10.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.10.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.10.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.100.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.100.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.100.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.101.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.101.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.101.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.102.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.102.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.102.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.103.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.103.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.103.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.104.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.104.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.104.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.105.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.105.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.105.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.106.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.106.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.106.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.107.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.107.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.107.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.108.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.108.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.108.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.109.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.109.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.109.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.11.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.11.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.11.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.110.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.110.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.110.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.111.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.111.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.111.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.112.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.112.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.112.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.113.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.113.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.113.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.114.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.114.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.114.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.115.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.115.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.115.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.116.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.116.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.116.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.117.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.117.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.117.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.118.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.118.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.118.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.119.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.119.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.119.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.12.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.12.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.12.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.120.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.120.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.120.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.121.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.121.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.121.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.122.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.122.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.122.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.123.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.123.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.123.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.124.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.124.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.124.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.125.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.125.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.125.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.126.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.126.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.126.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.127.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.127.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.127.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.128.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.128.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.128.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.129.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.129.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.129.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.13.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.13.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.13.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.130.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.130.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.130.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.131.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.131.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.131.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.132.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.132.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.132.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.133.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.133.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.133.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.134.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.134.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.134.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.135.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.135.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.135.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.136.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.136.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.136.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.137.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.137.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.137.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.138.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.138.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.138.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.139.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.139.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.139.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.14.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.14.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.14.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.140.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.140.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.140.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.141.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.141.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.141.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.142.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.142.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.142.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.143.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.143.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.143.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.144.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.144.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.144.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.145.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.145.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.145.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.146.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.146.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.146.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.147.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.147.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.147.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.148.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.148.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.148.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.149.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.149.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.149.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.15.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.15.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.15.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.150.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.150.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.150.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.151.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.151.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.151.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.152.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.152.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.152.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.153.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.153.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.153.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.154.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.154.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.154.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.155.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.155.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.155.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.156.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.156.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.156.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.157.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.157.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.157.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.158.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.158.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.158.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.159.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.159.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.159.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.experts.16.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.16.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.16.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.17.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.17.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.17.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.18.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.18.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.18.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.19.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.19.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.19.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.2.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.2.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.2.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.20.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.20.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.20.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.21.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.21.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.21.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.22.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.22.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.22.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.23.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.23.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.23.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.24.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.24.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.24.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.25.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.25.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.25.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.26.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.26.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.26.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.27.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.27.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.27.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.28.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.28.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.28.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.29.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.29.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.29.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.3.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.3.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.3.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.30.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.30.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.30.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.31.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.31.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.31.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.32.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.32.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.32.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.33.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.33.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.33.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.34.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.34.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.34.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.35.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.35.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.35.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.36.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.36.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.36.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.37.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.37.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.37.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.38.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.38.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.38.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.39.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.39.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.39.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.4.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.4.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.4.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.40.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.40.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.40.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.41.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.41.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.41.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.42.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.42.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.42.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.43.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.43.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.43.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.44.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.44.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.44.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.45.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.45.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.45.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.46.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.46.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.46.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.47.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.47.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.47.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.48.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.48.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.48.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.49.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.49.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.49.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.5.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.5.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.5.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.50.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.50.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.50.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.51.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.51.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.51.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.52.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.52.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.52.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.53.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.53.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.53.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.54.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.54.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.54.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.55.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.55.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.55.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.56.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.56.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.56.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.57.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.57.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.57.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.58.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.58.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.58.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.59.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.59.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.59.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.6.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.6.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.6.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.60.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.60.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.60.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.61.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.61.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.61.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.62.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.62.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.62.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.63.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.63.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.63.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.64.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.64.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.64.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.65.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.65.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.65.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.66.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.66.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.66.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.67.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.67.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.67.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.68.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.68.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.68.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.69.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.69.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.69.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.7.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.7.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.7.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.70.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.70.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.70.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.71.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.71.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.71.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.72.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.72.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.72.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.73.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.73.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.73.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.74.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.74.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.74.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.75.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.75.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.75.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.76.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.76.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.76.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.77.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.77.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.77.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.78.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.78.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.78.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.79.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.79.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.79.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.8.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.8.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.8.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.80.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.80.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.80.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.81.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.81.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.81.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.82.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.82.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.82.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.83.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.83.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.83.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.84.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.84.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.84.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.85.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.85.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.85.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.86.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.86.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.86.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.87.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.87.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.87.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.88.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.88.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.88.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.89.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.89.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.89.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.9.down_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.9.gate_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.9.up_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.mlp.experts.90.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.90.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.90.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.91.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.91.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.91.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.92.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.92.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.92.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.93.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.93.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.93.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.94.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.94.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.94.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.95.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.95.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.95.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.96.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.96.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.96.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.97.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.97.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.97.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.98.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.98.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.98.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.99.down_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.99.gate_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.experts.99.up_proj.weight": "model-00035-of-00142.safetensors", + "model.layers.24.mlp.gate.e_score_correction_bias": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.gate.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.shared_experts.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.shared_experts.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.mlp.shared_experts.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00036-of-00142.safetensors", + "model.layers.24.self_attn.k_norm.weight": "model-00034-of-00142.safetensors", + "model.layers.24.self_attn.k_proj.bias": "model-00034-of-00142.safetensors", + "model.layers.24.self_attn.k_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.self_attn.q_norm.weight": "model-00034-of-00142.safetensors", + "model.layers.24.self_attn.q_proj.bias": "model-00034-of-00142.safetensors", + "model.layers.24.self_attn.q_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.24.self_attn.v_proj.bias": "model-00034-of-00142.safetensors", + "model.layers.24.self_attn.v_proj.weight": "model-00034-of-00142.safetensors", + "model.layers.25.input_layernorm.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.0.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.0.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.0.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.1.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.1.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.1.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.10.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.10.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.10.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.100.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.100.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.100.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.101.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.101.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.101.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.102.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.102.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.102.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.103.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.103.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.103.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.104.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.104.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.104.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.105.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.105.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.105.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.106.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.106.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.106.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.107.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.107.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.107.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.108.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.108.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.108.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.109.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.109.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.109.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.11.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.11.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.11.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.110.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.110.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.110.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.111.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.111.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.111.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.112.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.112.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.112.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.113.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.113.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.113.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.114.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.114.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.114.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.115.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.115.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.115.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.116.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.116.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.116.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.117.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.117.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.117.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.118.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.118.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.118.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.119.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.119.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.119.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.12.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.12.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.12.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.120.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.120.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.120.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.121.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.121.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.121.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.122.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.122.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.122.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.123.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.123.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.123.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.124.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.124.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.124.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.125.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.125.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.125.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.126.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.126.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.126.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.127.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.127.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.127.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.128.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.128.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.128.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.129.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.129.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.129.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.13.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.13.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.13.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.130.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.130.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.130.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.131.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.131.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.131.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.132.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.132.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.132.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.133.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.133.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.133.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.134.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.134.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.134.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.135.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.135.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.135.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.136.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.136.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.136.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.137.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.137.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.137.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.138.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.138.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.138.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.139.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.139.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.139.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.14.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.14.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.14.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.140.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.140.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.140.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.141.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.141.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.141.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.142.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.142.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.142.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.143.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.143.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.143.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.144.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.144.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.144.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.145.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.145.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.145.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.146.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.146.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.146.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.147.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.147.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.147.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.148.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.148.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.148.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.149.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.149.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.149.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.15.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.15.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.15.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.150.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.150.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.150.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.151.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.151.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.151.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.152.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.152.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.152.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.153.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.153.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.153.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.154.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.154.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.154.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.155.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.155.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.155.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.156.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.156.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.156.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.157.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.157.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.157.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.158.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.158.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.158.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.159.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.159.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.159.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.16.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.16.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.16.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.17.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.17.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.17.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.18.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.18.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.18.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.19.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.19.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.19.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.2.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.2.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.2.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.20.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.20.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.20.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.21.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.21.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.21.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.22.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.22.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.22.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.23.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.23.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.23.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.24.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.24.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.24.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.25.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.25.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.25.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.26.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.26.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.26.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.27.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.27.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.27.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.28.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.28.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.28.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.29.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.29.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.29.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.3.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.3.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.3.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.30.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.30.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.30.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.31.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.31.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.31.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.32.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.32.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.32.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.33.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.33.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.33.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.34.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.34.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.34.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.35.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.35.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.35.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.36.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.36.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.36.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.37.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.37.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.37.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.38.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.38.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.38.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.39.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.39.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.39.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.4.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.4.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.4.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.40.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.40.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.40.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.41.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.41.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.41.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.42.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.42.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.42.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.43.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.43.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.43.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.44.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.44.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.44.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.45.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.45.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.45.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.46.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.46.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.46.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.47.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.47.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.47.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.48.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.48.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.48.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.49.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.49.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.49.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.5.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.5.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.5.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.50.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.50.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.50.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.51.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.51.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.51.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.52.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.52.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.52.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.53.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.53.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.53.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.54.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.54.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.54.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.55.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.55.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.55.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.56.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.56.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.56.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.57.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.57.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.57.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.58.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.58.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.58.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.59.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.59.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.59.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.6.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.6.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.6.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.60.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.60.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.60.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.61.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.61.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.61.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.62.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.62.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.62.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.63.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.63.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.63.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.64.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.64.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.64.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.65.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.65.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.65.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.66.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.66.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.66.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.67.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.67.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.67.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.68.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.68.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.68.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.69.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.69.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.69.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.7.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.7.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.70.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.70.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.70.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.71.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.71.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.71.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.72.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.72.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.72.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.73.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.73.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.73.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.74.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.74.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.74.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.75.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.75.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.75.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.76.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.76.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.76.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.77.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.77.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.77.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.78.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.78.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.78.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.79.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.79.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.79.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.8.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.8.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.8.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.80.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.80.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.80.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.81.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.81.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.81.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.82.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.82.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.82.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.83.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.83.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.83.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.84.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.84.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.84.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.85.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.85.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.85.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.86.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.86.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.86.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.87.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.87.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.87.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.88.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.88.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.88.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.89.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.89.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.89.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.9.down_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.9.gate_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.9.up_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.mlp.experts.90.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.90.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.90.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.91.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.91.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.91.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.92.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.92.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.92.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.93.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.93.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.93.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.94.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.94.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.94.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.95.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.95.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.95.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.96.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.96.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.96.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.97.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.97.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.97.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.98.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.98.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.98.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.99.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.99.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.experts.99.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.gate.e_score_correction_bias": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.gate.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.shared_experts.down_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.shared_experts.gate_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.mlp.shared_experts.up_proj.weight": "model-00037-of-00142.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00037-of-00142.safetensors", + "model.layers.25.self_attn.k_norm.weight": "model-00036-of-00142.safetensors", + "model.layers.25.self_attn.k_proj.bias": "model-00036-of-00142.safetensors", + "model.layers.25.self_attn.k_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.self_attn.q_norm.weight": "model-00036-of-00142.safetensors", + "model.layers.25.self_attn.q_proj.bias": "model-00036-of-00142.safetensors", + "model.layers.25.self_attn.q_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.25.self_attn.v_proj.bias": "model-00036-of-00142.safetensors", + "model.layers.25.self_attn.v_proj.weight": "model-00036-of-00142.safetensors", + "model.layers.26.input_layernorm.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.0.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.0.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.0.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.1.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.1.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.1.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.10.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.10.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.10.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.100.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.100.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.100.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.101.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.101.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.101.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.102.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.102.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.102.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.103.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.103.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.103.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.104.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.104.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.104.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.105.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.105.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.105.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.106.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.106.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.106.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.107.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.107.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.107.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.108.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.108.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.108.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.109.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.109.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.109.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.11.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.11.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.11.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.110.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.110.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.110.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.111.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.111.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.111.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.112.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.112.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.112.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.113.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.113.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.113.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.114.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.114.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.114.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.115.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.115.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.115.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.116.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.116.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.116.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.117.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.117.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.117.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.118.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.118.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.118.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.119.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.119.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.119.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.12.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.12.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.12.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.120.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.120.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.120.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.121.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.121.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.121.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.122.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.122.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.122.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.123.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.123.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.123.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.124.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.124.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.124.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.125.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.125.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.125.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.126.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.126.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.126.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.127.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.127.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.127.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.128.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.128.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.128.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.129.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.129.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.129.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.13.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.13.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.13.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.130.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.130.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.130.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.131.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.131.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.131.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.132.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.132.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.132.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.133.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.133.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.133.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.134.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.134.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.134.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.135.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.135.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.135.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.136.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.136.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.136.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.137.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.137.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.137.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.138.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.138.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.138.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.139.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.139.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.139.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.14.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.14.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.14.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.140.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.140.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.140.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.141.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.141.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.141.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.142.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.142.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.142.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.143.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.143.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.143.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.144.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.144.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.144.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.145.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.145.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.145.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.146.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.146.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.146.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.147.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.147.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.147.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.148.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.148.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.148.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.149.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.149.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.149.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.15.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.15.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.15.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.150.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.150.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.150.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.151.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.151.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.151.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.152.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.152.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.152.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.153.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.153.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.153.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.154.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.154.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.154.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.155.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.155.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.155.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.156.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.156.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.156.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.157.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.157.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.157.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.158.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.158.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.158.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.159.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.159.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.159.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.experts.16.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.16.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.16.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.17.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.17.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.17.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.18.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.18.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.18.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.19.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.19.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.19.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.2.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.2.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.2.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.20.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.20.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.20.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.21.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.21.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.21.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.22.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.22.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.22.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.23.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.23.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.23.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.24.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.24.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.24.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.25.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.25.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.25.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.26.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.26.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.26.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.27.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.27.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.27.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.28.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.28.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.28.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.29.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.29.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.29.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.3.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.3.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.3.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.30.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.30.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.30.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.31.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.31.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.31.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.32.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.32.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.32.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.33.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.33.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.33.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.34.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.34.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.34.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.35.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.35.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.35.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.36.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.36.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.36.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.37.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.37.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.37.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.38.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.38.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.38.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.39.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.39.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.39.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.4.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.4.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.4.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.40.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.40.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.40.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.41.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.41.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.41.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.42.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.42.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.42.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.43.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.43.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.43.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.44.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.44.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.44.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.45.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.45.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.45.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.46.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.46.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.46.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.47.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.47.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.47.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.48.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.48.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.48.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.49.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.49.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.49.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.5.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.5.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.5.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.50.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.50.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.50.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.51.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.51.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.51.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.52.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.52.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.52.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.53.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.53.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.53.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.54.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.54.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.54.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.55.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.55.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.55.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.56.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.56.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.56.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.57.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.57.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.57.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.58.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.58.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.58.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.59.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.59.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.59.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.6.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.6.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.6.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.60.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.60.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.60.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.61.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.61.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.61.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.62.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.62.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.62.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.63.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.63.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.63.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.64.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.64.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.64.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.65.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.65.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.65.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.66.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.66.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.66.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.67.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.67.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.67.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.68.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.68.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.68.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.69.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.69.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.69.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.7.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.7.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.7.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.70.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.70.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.70.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.71.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.71.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.71.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.72.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.72.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.72.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.73.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.73.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.73.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.74.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.74.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.74.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.75.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.75.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.75.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.76.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.76.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.76.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.77.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.77.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.77.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.78.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.78.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.78.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.79.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.79.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.79.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.8.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.8.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.8.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.80.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.80.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.80.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.81.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.81.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.81.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.82.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.82.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.82.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.83.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.83.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.83.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.84.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.84.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.84.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.85.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.85.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.85.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.86.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.86.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.86.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.87.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.87.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.87.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.88.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.88.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.88.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.89.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.89.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.89.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.9.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.9.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.9.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.90.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.90.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.90.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.91.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.91.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.91.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.92.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.92.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.92.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.93.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.93.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.93.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.94.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.94.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.94.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.95.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.95.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.95.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.96.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.96.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.96.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.97.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.97.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.97.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.98.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.98.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.98.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.99.down_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.99.gate_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.experts.99.up_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.mlp.gate.e_score_correction_bias": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.gate.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.shared_experts.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.shared_experts.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.mlp.shared_experts.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00039-of-00142.safetensors", + "model.layers.26.self_attn.k_norm.weight": "model-00038-of-00142.safetensors", + "model.layers.26.self_attn.k_proj.bias": "model-00038-of-00142.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.self_attn.q_norm.weight": "model-00038-of-00142.safetensors", + "model.layers.26.self_attn.q_proj.bias": "model-00038-of-00142.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.26.self_attn.v_proj.bias": "model-00038-of-00142.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00038-of-00142.safetensors", + "model.layers.27.input_layernorm.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.0.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.0.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.0.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.1.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.1.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.1.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.10.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.10.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.10.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.100.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.100.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.100.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.101.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.101.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.101.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.102.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.102.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.102.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.103.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.103.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.103.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.104.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.104.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.104.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.105.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.105.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.105.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.106.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.106.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.106.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.107.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.107.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.107.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.108.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.108.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.108.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.109.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.109.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.109.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.11.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.11.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.11.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.110.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.110.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.110.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.111.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.111.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.111.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.112.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.112.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.112.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.113.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.113.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.113.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.114.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.114.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.114.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.115.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.115.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.115.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.116.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.116.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.116.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.117.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.117.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.117.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.118.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.118.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.118.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.119.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.119.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.119.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.12.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.12.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.12.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.120.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.120.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.120.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.121.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.121.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.121.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.122.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.122.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.122.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.123.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.123.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.123.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.124.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.124.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.124.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.125.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.125.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.125.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.126.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.126.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.126.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.127.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.127.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.127.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.128.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.128.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.128.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.129.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.129.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.129.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.13.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.13.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.13.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.130.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.130.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.130.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.131.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.131.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.131.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.132.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.132.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.132.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.133.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.133.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.133.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.134.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.134.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.134.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.135.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.135.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.135.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.136.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.136.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.136.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.137.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.137.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.137.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.138.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.138.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.138.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.139.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.139.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.139.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.14.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.14.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.14.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.140.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.140.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.140.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.141.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.141.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.141.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.142.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.142.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.142.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.143.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.143.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.143.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.144.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.144.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.144.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.145.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.145.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.145.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.146.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.146.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.146.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.147.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.147.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.147.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.148.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.148.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.148.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.149.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.149.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.149.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.15.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.15.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.15.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.150.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.150.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.150.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.151.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.151.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.151.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.152.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.152.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.152.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.153.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.153.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.153.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.154.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.154.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.154.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.155.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.155.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.155.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.156.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.156.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.156.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.157.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.157.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.157.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.158.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.158.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.158.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.159.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.159.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.159.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.experts.16.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.16.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.16.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.17.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.17.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.17.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.18.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.18.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.18.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.19.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.19.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.19.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.2.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.2.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.2.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.20.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.20.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.20.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.21.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.21.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.21.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.22.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.22.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.22.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.23.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.23.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.23.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.24.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.24.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.24.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.25.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.25.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.25.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.26.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.26.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.26.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.27.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.27.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.27.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.28.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.28.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.28.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.29.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.29.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.29.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.3.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.3.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.3.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.30.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.30.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.30.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.31.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.31.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.31.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.32.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.32.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.32.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.33.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.33.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.33.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.34.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.34.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.34.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.35.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.35.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.35.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.36.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.36.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.36.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.37.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.37.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.37.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.38.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.38.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.38.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.39.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.39.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.39.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.4.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.4.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.4.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.40.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.40.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.40.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.41.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.41.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.41.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.42.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.42.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.42.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.43.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.43.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.43.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.44.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.44.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.44.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.45.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.45.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.45.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.46.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.46.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.46.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.47.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.47.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.47.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.48.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.48.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.48.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.49.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.49.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.49.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.5.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.5.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.5.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.50.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.50.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.50.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.51.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.51.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.51.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.52.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.52.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.52.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.53.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.53.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.53.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.54.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.54.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.54.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.55.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.55.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.55.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.56.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.56.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.56.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.57.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.57.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.57.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.58.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.58.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.58.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.59.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.59.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.59.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.6.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.6.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.6.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.60.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.60.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.60.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.61.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.61.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.61.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.62.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.62.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.62.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.63.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.63.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.63.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.64.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.64.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.64.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.65.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.65.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.65.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.66.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.66.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.66.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.67.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.67.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.67.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.68.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.68.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.68.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.69.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.69.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.69.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.7.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.7.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.70.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.70.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.70.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.71.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.71.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.71.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.72.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.72.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.72.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.73.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.73.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.73.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.74.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.74.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.74.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.75.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.75.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.75.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.76.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.76.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.76.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.77.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.77.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.77.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.78.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.78.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.78.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.79.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.79.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.79.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.8.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.8.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.8.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.80.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.80.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.80.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.81.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.81.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.81.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.82.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.82.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.82.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.83.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.83.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.83.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.84.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.84.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.84.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.85.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.85.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.85.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.86.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.86.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.86.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.87.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.87.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.87.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.88.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.88.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.88.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.89.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.89.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.89.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.9.down_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.9.gate_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.9.up_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.mlp.experts.90.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.90.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.90.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.91.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.91.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.91.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.92.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.92.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.92.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.93.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.93.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.93.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.94.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.94.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.94.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.95.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.95.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.95.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.96.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.96.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.96.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.97.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.97.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.97.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.98.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.98.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.98.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.99.down_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.99.gate_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.experts.99.up_proj.weight": "model-00040-of-00142.safetensors", + "model.layers.27.mlp.gate.e_score_correction_bias": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.gate.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.shared_experts.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.shared_experts.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.mlp.shared_experts.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00041-of-00142.safetensors", + "model.layers.27.self_attn.k_norm.weight": "model-00039-of-00142.safetensors", + "model.layers.27.self_attn.k_proj.bias": "model-00039-of-00142.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.self_attn.q_norm.weight": "model-00039-of-00142.safetensors", + "model.layers.27.self_attn.q_proj.bias": "model-00039-of-00142.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.27.self_attn.v_proj.bias": "model-00039-of-00142.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00039-of-00142.safetensors", + "model.layers.28.input_layernorm.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.0.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.0.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.0.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.1.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.1.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.1.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.10.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.10.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.10.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.100.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.100.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.100.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.101.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.101.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.101.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.102.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.102.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.102.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.103.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.103.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.103.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.104.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.104.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.104.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.105.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.105.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.105.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.106.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.106.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.106.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.107.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.107.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.107.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.108.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.108.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.108.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.109.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.109.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.109.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.11.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.11.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.11.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.110.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.110.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.110.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.111.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.111.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.111.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.112.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.112.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.112.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.113.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.113.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.113.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.114.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.114.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.114.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.115.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.115.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.115.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.116.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.116.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.116.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.117.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.117.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.117.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.118.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.118.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.118.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.119.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.119.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.119.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.12.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.12.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.12.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.120.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.120.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.120.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.121.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.121.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.121.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.122.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.122.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.122.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.123.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.123.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.123.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.124.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.124.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.124.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.125.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.125.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.125.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.126.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.126.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.126.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.127.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.127.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.127.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.128.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.128.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.128.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.129.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.129.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.129.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.13.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.13.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.13.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.130.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.130.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.130.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.131.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.131.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.131.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.132.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.132.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.132.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.133.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.133.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.133.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.134.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.134.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.134.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.135.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.135.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.135.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.136.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.136.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.136.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.137.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.137.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.137.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.138.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.138.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.138.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.139.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.139.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.139.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.14.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.14.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.14.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.140.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.140.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.140.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.141.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.141.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.141.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.142.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.142.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.142.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.143.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.143.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.143.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.144.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.144.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.144.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.145.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.145.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.145.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.146.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.146.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.146.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.147.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.147.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.147.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.148.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.148.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.148.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.149.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.149.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.149.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.15.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.15.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.15.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.150.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.150.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.150.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.151.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.151.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.151.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.152.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.152.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.152.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.153.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.153.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.153.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.154.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.154.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.154.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.155.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.155.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.155.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.156.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.156.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.156.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.157.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.157.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.157.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.158.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.158.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.158.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.159.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.159.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.159.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.16.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.16.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.16.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.17.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.17.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.17.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.18.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.18.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.18.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.19.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.19.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.19.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.2.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.2.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.2.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.20.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.20.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.20.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.21.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.21.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.21.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.22.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.22.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.22.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.23.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.23.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.23.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.24.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.24.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.24.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.25.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.25.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.25.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.26.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.26.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.26.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.27.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.27.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.27.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.28.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.28.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.28.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.29.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.29.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.29.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.3.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.3.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.3.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.30.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.30.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.30.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.31.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.31.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.31.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.32.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.32.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.32.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.33.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.33.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.33.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.34.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.34.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.34.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.35.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.35.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.35.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.36.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.36.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.36.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.37.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.37.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.37.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.38.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.38.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.38.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.39.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.39.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.39.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.4.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.4.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.4.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.40.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.40.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.40.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.41.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.41.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.41.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.42.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.42.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.42.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.43.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.43.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.43.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.44.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.44.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.44.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.45.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.45.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.45.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.46.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.46.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.46.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.47.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.47.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.47.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.48.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.48.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.48.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.49.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.49.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.49.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.5.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.5.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.5.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.50.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.50.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.50.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.51.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.51.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.51.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.52.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.52.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.52.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.53.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.53.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.53.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.54.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.54.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.54.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.55.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.55.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.55.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.56.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.56.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.56.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.57.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.57.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.57.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.58.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.58.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.58.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.59.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.59.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.59.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.6.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.6.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.6.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.60.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.60.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.60.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.61.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.61.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.61.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.62.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.62.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.62.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.63.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.63.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.63.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.64.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.64.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.64.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.65.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.65.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.65.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.66.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.66.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.66.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.67.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.67.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.67.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.68.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.68.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.68.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.69.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.69.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.69.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.7.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.7.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.7.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.70.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.70.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.70.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.71.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.71.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.71.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.72.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.72.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.72.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.73.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.73.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.73.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.74.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.74.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.74.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.75.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.75.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.75.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.76.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.76.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.76.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.77.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.77.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.77.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.78.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.78.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.78.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.79.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.79.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.79.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.8.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.8.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.8.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.80.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.80.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.80.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.81.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.81.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.81.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.82.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.82.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.82.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.83.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.83.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.83.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.84.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.84.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.84.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.85.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.85.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.85.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.86.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.86.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.86.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.87.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.87.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.87.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.88.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.88.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.88.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.89.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.89.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.89.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.9.down_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.9.gate_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.9.up_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.mlp.experts.90.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.90.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.90.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.91.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.91.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.91.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.92.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.92.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.92.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.93.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.93.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.93.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.94.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.94.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.94.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.95.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.95.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.95.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.96.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.96.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.96.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.97.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.97.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.97.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.98.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.98.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.98.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.99.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.99.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.experts.99.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.gate.e_score_correction_bias": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.gate.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.shared_experts.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.shared_experts.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.mlp.shared_experts.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00042-of-00142.safetensors", + "model.layers.28.self_attn.k_norm.weight": "model-00041-of-00142.safetensors", + "model.layers.28.self_attn.k_proj.bias": "model-00041-of-00142.safetensors", + "model.layers.28.self_attn.k_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.self_attn.q_norm.weight": "model-00041-of-00142.safetensors", + "model.layers.28.self_attn.q_proj.bias": "model-00041-of-00142.safetensors", + "model.layers.28.self_attn.q_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.28.self_attn.v_proj.bias": "model-00041-of-00142.safetensors", + "model.layers.28.self_attn.v_proj.weight": "model-00041-of-00142.safetensors", + "model.layers.29.input_layernorm.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.0.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.0.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.0.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.1.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.1.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.1.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.10.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.10.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.10.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.100.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.100.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.100.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.101.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.101.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.101.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.102.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.102.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.102.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.103.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.103.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.103.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.104.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.104.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.104.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.105.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.105.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.105.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.106.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.106.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.106.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.107.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.107.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.107.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.108.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.108.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.108.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.109.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.109.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.109.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.11.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.11.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.11.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.110.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.110.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.110.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.111.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.111.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.111.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.112.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.112.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.112.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.113.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.113.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.113.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.114.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.114.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.114.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.115.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.115.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.115.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.116.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.116.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.116.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.117.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.117.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.117.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.118.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.118.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.118.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.119.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.119.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.119.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.12.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.12.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.12.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.120.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.120.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.120.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.121.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.121.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.121.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.122.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.122.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.122.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.123.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.123.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.123.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.124.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.124.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.124.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.125.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.125.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.125.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.126.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.126.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.126.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.127.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.127.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.127.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.128.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.128.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.128.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.129.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.129.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.129.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.13.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.13.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.13.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.130.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.130.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.130.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.131.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.131.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.131.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.132.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.132.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.132.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.133.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.133.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.133.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.134.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.134.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.134.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.135.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.135.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.135.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.136.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.136.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.136.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.137.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.137.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.137.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.138.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.138.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.138.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.139.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.139.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.139.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.14.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.14.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.14.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.140.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.140.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.140.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.141.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.141.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.141.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.142.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.142.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.142.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.143.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.143.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.143.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.144.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.144.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.144.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.145.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.145.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.145.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.146.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.146.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.146.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.147.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.147.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.147.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.148.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.148.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.148.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.149.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.149.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.149.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.15.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.15.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.15.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.150.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.150.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.150.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.151.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.151.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.151.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.152.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.152.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.152.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.153.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.153.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.153.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.154.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.154.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.154.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.155.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.155.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.155.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.156.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.156.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.156.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.157.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.157.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.157.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.158.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.158.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.158.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.159.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.159.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.159.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.experts.16.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.16.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.16.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.17.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.17.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.17.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.18.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.18.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.18.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.19.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.19.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.19.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.2.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.2.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.2.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.20.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.20.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.20.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.21.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.21.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.21.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.22.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.22.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.22.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.23.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.23.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.23.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.24.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.24.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.24.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.25.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.25.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.25.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.26.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.26.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.26.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.27.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.27.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.27.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.28.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.28.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.28.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.29.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.29.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.29.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.3.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.3.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.3.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.30.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.30.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.30.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.31.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.31.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.31.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.32.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.32.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.32.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.33.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.33.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.33.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.34.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.34.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.34.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.35.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.35.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.35.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.36.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.36.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.36.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.37.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.37.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.37.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.38.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.38.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.38.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.39.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.39.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.39.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.4.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.4.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.4.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.40.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.40.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.40.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.41.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.41.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.41.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.42.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.42.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.42.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.43.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.43.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.43.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.44.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.44.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.44.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.45.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.45.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.45.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.46.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.46.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.46.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.47.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.47.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.47.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.48.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.48.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.48.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.49.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.49.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.49.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.5.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.5.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.5.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.50.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.50.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.50.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.51.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.51.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.51.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.52.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.52.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.52.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.53.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.53.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.53.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.54.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.54.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.54.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.55.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.55.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.55.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.56.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.56.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.56.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.57.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.57.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.57.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.58.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.58.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.58.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.59.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.59.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.59.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.6.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.6.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.6.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.60.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.60.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.60.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.61.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.61.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.61.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.62.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.62.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.62.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.63.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.63.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.63.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.64.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.64.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.64.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.65.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.65.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.65.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.66.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.66.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.66.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.67.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.67.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.67.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.68.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.68.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.68.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.69.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.69.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.69.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.7.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.7.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.7.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.70.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.70.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.70.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.71.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.71.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.71.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.72.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.72.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.72.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.73.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.73.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.73.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.74.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.74.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.74.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.75.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.75.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.75.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.76.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.76.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.76.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.77.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.77.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.77.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.78.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.78.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.78.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.79.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.79.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.79.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.8.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.8.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.8.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.80.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.80.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.80.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.81.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.81.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.81.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.82.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.82.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.82.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.83.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.83.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.83.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.84.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.84.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.84.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.85.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.85.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.85.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.86.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.86.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.86.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.87.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.87.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.87.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.88.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.88.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.88.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.89.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.89.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.89.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.9.down_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.9.gate_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.9.up_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.mlp.experts.90.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.90.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.90.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.91.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.91.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.91.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.92.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.92.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.92.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.93.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.93.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.93.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.94.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.94.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.94.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.95.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.95.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.95.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.96.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.96.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.96.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.97.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.97.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.97.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.98.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.98.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.98.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.99.down_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.99.gate_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.experts.99.up_proj.weight": "model-00043-of-00142.safetensors", + "model.layers.29.mlp.gate.e_score_correction_bias": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.gate.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.shared_experts.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.shared_experts.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.mlp.shared_experts.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00044-of-00142.safetensors", + "model.layers.29.self_attn.k_norm.weight": "model-00042-of-00142.safetensors", + "model.layers.29.self_attn.k_proj.bias": "model-00042-of-00142.safetensors", + "model.layers.29.self_attn.k_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.self_attn.q_norm.weight": "model-00042-of-00142.safetensors", + "model.layers.29.self_attn.q_proj.bias": "model-00042-of-00142.safetensors", + "model.layers.29.self_attn.q_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.29.self_attn.v_proj.bias": "model-00042-of-00142.safetensors", + "model.layers.29.self_attn.v_proj.weight": "model-00042-of-00142.safetensors", + "model.layers.3.input_layernorm.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.0.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.0.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.0.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.1.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.1.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.1.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.10.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.10.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.10.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.100.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.100.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.100.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.101.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.101.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.101.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.102.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.102.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.102.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.103.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.103.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.103.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.104.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.104.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.104.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.105.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.105.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.105.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.106.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.106.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.106.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.107.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.107.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.107.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.108.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.108.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.108.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.109.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.109.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.109.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.11.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.11.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.11.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.110.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.110.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.110.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.111.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.111.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.111.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.112.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.112.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.112.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.113.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.113.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.113.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.114.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.114.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.114.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.115.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.115.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.115.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.116.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.116.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.116.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.117.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.117.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.117.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.118.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.118.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.118.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.119.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.119.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.119.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.12.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.12.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.12.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.120.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.120.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.120.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.121.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.121.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.121.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.122.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.122.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.122.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.123.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.123.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.123.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.124.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.124.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.124.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.125.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.125.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.125.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.126.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.126.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.126.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.127.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.127.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.127.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.128.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.128.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.128.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.129.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.129.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.129.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.13.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.13.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.13.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.130.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.130.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.130.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.131.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.131.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.131.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.132.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.132.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.132.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.133.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.133.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.133.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.134.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.134.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.134.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.135.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.135.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.135.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.136.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.136.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.136.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.137.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.137.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.137.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.138.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.138.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.138.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.139.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.139.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.139.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.14.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.14.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.14.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.140.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.140.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.140.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.141.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.141.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.141.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.142.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.142.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.142.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.143.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.143.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.143.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.144.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.144.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.144.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.145.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.145.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.145.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.146.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.146.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.146.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.147.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.147.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.147.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.148.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.148.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.148.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.149.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.149.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.149.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.15.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.15.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.15.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.150.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.150.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.150.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.151.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.151.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.151.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.152.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.152.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.152.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.153.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.153.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.153.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.154.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.154.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.154.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.155.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.155.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.155.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.156.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.156.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.156.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.157.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.157.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.157.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.158.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.158.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.158.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.159.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.159.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.159.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.experts.16.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.16.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.16.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.17.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.17.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.17.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.18.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.18.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.18.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.19.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.19.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.19.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.2.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.2.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.2.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.20.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.20.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.20.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.21.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.21.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.21.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.22.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.22.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.22.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.23.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.23.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.23.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.24.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.24.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.24.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.25.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.25.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.25.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.26.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.26.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.26.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.27.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.27.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.27.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.28.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.28.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.28.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.29.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.29.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.29.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.3.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.3.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.3.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.30.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.30.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.30.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.31.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.31.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.31.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.32.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.32.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.32.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.33.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.33.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.33.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.34.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.34.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.34.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.35.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.35.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.35.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.36.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.36.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.36.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.37.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.37.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.37.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.38.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.38.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.38.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.39.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.39.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.39.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.4.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.4.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.4.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.40.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.40.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.40.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.41.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.41.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.41.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.42.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.42.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.42.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.43.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.43.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.43.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.44.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.44.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.44.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.45.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.45.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.45.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.46.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.46.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.46.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.47.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.47.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.47.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.48.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.48.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.48.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.49.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.49.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.49.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.5.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.5.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.5.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.50.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.50.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.50.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.51.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.51.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.51.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.52.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.52.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.52.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.53.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.53.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.53.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.54.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.54.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.54.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.55.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.55.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.55.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.56.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.56.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.56.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.57.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.57.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.57.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.58.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.58.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.58.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.59.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.59.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.59.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.6.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.6.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.6.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.60.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.60.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.60.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.61.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.61.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.61.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.62.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.62.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.62.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.63.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.63.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.63.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.64.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.64.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.64.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.65.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.65.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.65.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.66.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.66.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.66.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.67.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.67.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.67.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.68.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.68.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.68.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.69.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.69.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.69.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.7.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.7.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.70.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.70.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.70.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.71.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.71.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.71.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.72.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.72.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.72.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.73.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.73.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.73.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.74.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.74.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.74.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.75.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.75.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.75.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.76.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.76.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.76.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.77.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.77.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.77.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.78.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.78.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.78.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.79.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.79.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.79.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.8.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.8.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.8.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.80.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.80.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.80.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.81.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.81.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.81.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.82.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.82.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.82.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.83.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.83.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.83.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.84.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.84.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.84.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.85.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.85.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.85.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.86.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.86.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.86.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.87.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.87.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.87.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.88.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.88.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.88.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.89.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.89.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.89.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.9.down_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.9.gate_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.9.up_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.mlp.experts.90.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.90.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.90.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.91.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.91.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.91.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.92.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.92.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.92.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.93.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.93.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.93.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.94.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.94.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.94.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.95.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.95.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.95.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.96.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.96.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.96.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.97.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.97.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.97.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.98.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.98.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.98.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.99.down_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.99.gate_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.experts.99.up_proj.weight": "model-00002-of-00142.safetensors", + "model.layers.3.mlp.gate.e_score_correction_bias": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.gate.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.shared_experts.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.shared_experts.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.mlp.shared_experts.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00003-of-00142.safetensors", + "model.layers.3.self_attn.k_norm.weight": "model-00001-of-00142.safetensors", + "model.layers.3.self_attn.k_proj.bias": "model-00001-of-00142.safetensors", + "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.self_attn.q_norm.weight": "model-00001-of-00142.safetensors", + "model.layers.3.self_attn.q_proj.bias": "model-00001-of-00142.safetensors", + "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.3.self_attn.v_proj.bias": "model-00001-of-00142.safetensors", + "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00142.safetensors", + "model.layers.30.input_layernorm.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.0.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.0.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.0.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.1.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.1.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.1.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.10.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.10.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.10.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.100.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.100.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.100.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.101.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.101.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.101.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.102.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.102.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.102.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.103.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.103.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.103.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.104.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.104.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.104.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.105.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.105.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.105.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.106.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.106.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.106.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.107.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.107.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.107.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.108.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.108.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.108.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.109.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.109.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.109.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.11.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.11.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.11.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.110.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.110.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.110.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.111.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.111.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.111.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.112.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.112.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.112.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.113.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.113.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.113.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.114.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.114.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.114.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.115.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.115.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.115.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.116.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.116.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.116.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.117.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.117.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.117.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.118.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.118.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.118.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.119.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.119.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.119.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.12.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.12.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.12.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.120.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.120.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.120.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.121.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.121.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.121.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.122.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.122.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.122.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.123.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.123.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.123.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.124.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.124.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.124.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.125.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.125.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.125.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.126.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.126.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.126.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.127.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.127.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.127.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.128.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.128.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.128.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.129.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.129.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.129.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.13.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.13.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.13.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.130.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.130.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.130.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.131.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.131.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.131.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.132.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.132.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.132.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.133.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.133.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.133.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.134.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.134.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.134.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.135.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.135.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.135.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.136.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.136.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.136.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.137.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.137.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.137.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.138.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.138.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.138.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.139.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.139.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.139.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.14.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.14.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.14.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.140.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.140.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.140.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.141.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.141.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.141.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.142.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.142.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.142.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.143.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.143.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.143.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.144.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.144.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.144.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.145.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.145.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.145.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.146.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.146.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.146.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.147.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.147.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.147.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.148.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.148.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.148.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.149.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.149.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.149.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.15.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.15.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.15.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.150.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.150.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.150.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.151.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.151.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.151.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.152.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.152.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.152.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.153.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.153.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.153.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.154.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.154.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.154.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.155.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.155.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.155.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.156.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.156.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.156.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.157.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.157.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.157.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.158.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.158.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.158.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.159.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.159.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.159.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.16.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.16.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.16.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.17.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.17.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.17.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.18.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.18.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.18.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.19.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.19.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.19.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.2.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.2.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.2.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.20.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.20.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.20.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.21.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.21.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.21.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.22.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.22.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.22.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.23.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.23.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.23.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.24.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.24.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.24.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.25.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.25.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.25.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.26.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.26.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.26.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.27.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.27.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.27.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.28.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.28.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.28.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.29.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.29.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.29.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.3.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.3.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.3.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.30.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.30.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.30.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.31.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.31.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.31.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.32.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.32.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.32.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.33.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.33.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.33.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.34.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.34.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.34.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.35.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.35.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.35.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.36.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.36.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.36.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.37.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.37.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.37.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.38.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.38.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.38.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.39.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.39.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.39.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.4.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.4.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.4.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.40.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.40.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.40.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.41.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.41.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.41.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.42.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.42.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.42.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.43.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.43.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.43.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.44.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.44.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.44.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.45.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.45.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.45.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.46.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.46.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.46.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.47.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.47.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.47.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.48.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.48.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.48.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.49.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.49.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.49.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.5.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.5.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.5.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.50.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.50.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.50.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.51.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.51.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.51.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.52.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.52.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.52.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.53.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.53.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.53.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.54.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.54.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.54.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.55.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.55.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.55.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.56.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.56.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.56.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.57.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.57.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.57.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.58.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.58.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.58.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.59.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.59.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.59.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.6.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.6.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.6.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.60.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.60.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.60.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.61.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.61.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.61.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.62.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.62.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.62.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.63.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.63.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.63.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.64.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.64.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.64.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.65.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.65.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.65.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.66.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.66.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.66.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.67.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.67.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.67.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.68.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.68.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.68.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.69.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.69.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.69.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.7.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.7.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.7.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.70.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.70.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.70.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.71.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.71.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.71.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.72.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.72.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.72.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.73.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.73.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.73.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.74.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.74.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.74.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.75.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.75.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.75.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.76.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.76.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.76.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.77.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.77.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.77.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.78.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.78.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.78.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.79.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.79.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.79.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.8.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.8.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.8.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.80.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.80.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.80.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.81.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.81.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.81.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.82.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.82.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.82.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.83.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.83.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.83.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.84.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.84.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.84.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.85.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.85.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.85.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.86.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.86.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.86.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.87.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.87.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.87.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.88.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.88.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.88.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.89.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.89.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.89.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.9.down_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.9.gate_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.9.up_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.mlp.experts.90.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.90.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.90.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.91.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.91.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.91.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.92.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.92.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.92.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.93.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.93.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.93.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.94.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.94.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.94.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.95.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.95.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.95.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.96.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.96.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.96.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.97.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.97.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.97.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.98.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.98.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.98.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.99.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.99.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.experts.99.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.gate.e_score_correction_bias": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.gate.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.shared_experts.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.shared_experts.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.mlp.shared_experts.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00045-of-00142.safetensors", + "model.layers.30.self_attn.k_norm.weight": "model-00044-of-00142.safetensors", + "model.layers.30.self_attn.k_proj.bias": "model-00044-of-00142.safetensors", + "model.layers.30.self_attn.k_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.self_attn.q_norm.weight": "model-00044-of-00142.safetensors", + "model.layers.30.self_attn.q_proj.bias": "model-00044-of-00142.safetensors", + "model.layers.30.self_attn.q_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.30.self_attn.v_proj.bias": "model-00044-of-00142.safetensors", + "model.layers.30.self_attn.v_proj.weight": "model-00044-of-00142.safetensors", + "model.layers.31.input_layernorm.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.0.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.0.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.0.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.1.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.1.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.1.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.10.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.10.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.10.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.100.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.100.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.100.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.101.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.101.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.101.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.102.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.102.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.102.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.103.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.103.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.103.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.104.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.104.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.104.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.105.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.105.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.105.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.106.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.106.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.106.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.107.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.107.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.107.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.108.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.108.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.108.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.109.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.109.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.109.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.11.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.11.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.11.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.110.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.110.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.110.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.111.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.111.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.111.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.112.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.112.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.112.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.113.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.113.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.113.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.114.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.114.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.114.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.115.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.115.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.115.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.116.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.116.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.116.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.117.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.117.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.117.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.118.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.118.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.118.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.119.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.119.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.119.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.12.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.12.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.12.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.120.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.120.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.120.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.121.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.121.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.121.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.122.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.122.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.122.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.123.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.123.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.123.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.124.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.124.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.124.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.125.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.125.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.125.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.126.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.126.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.126.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.127.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.127.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.127.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.128.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.128.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.128.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.129.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.129.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.129.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.13.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.13.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.13.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.130.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.130.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.130.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.131.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.131.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.131.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.132.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.132.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.132.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.133.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.133.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.133.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.134.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.134.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.134.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.135.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.135.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.135.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.136.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.136.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.136.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.137.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.137.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.137.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.138.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.138.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.138.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.139.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.139.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.139.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.14.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.14.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.14.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.140.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.140.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.140.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.141.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.141.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.141.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.142.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.142.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.142.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.143.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.143.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.143.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.144.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.144.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.144.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.145.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.145.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.145.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.146.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.146.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.146.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.147.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.147.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.147.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.148.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.148.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.148.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.149.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.149.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.149.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.15.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.15.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.15.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.150.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.150.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.150.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.151.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.151.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.151.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.152.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.152.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.152.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.153.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.153.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.153.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.154.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.154.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.154.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.155.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.155.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.155.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.156.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.156.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.156.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.157.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.157.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.157.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.158.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.158.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.158.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.159.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.159.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.159.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.experts.16.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.16.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.16.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.17.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.17.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.17.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.18.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.18.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.18.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.19.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.19.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.19.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.2.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.2.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.2.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.20.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.20.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.20.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.21.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.21.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.21.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.22.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.22.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.22.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.23.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.23.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.23.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.24.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.24.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.24.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.25.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.25.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.25.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.26.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.26.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.26.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.27.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.27.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.27.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.28.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.28.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.28.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.29.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.29.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.29.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.3.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.3.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.3.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.30.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.30.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.30.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.31.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.31.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.31.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.32.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.32.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.32.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.33.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.33.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.33.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.34.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.34.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.34.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.35.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.35.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.35.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.36.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.36.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.36.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.37.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.37.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.37.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.38.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.38.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.38.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.39.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.39.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.39.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.4.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.4.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.4.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.40.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.40.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.40.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.41.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.41.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.41.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.42.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.42.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.42.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.43.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.43.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.43.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.44.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.44.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.44.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.45.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.45.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.45.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.46.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.46.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.46.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.47.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.47.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.47.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.48.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.48.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.48.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.49.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.49.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.49.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.5.down_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.5.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.5.up_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.50.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.50.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.50.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.51.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.51.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.51.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.52.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.52.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.52.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.53.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.53.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.53.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.54.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.54.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.54.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.55.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.55.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.55.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.56.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.56.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.56.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.57.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.57.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.57.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.58.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.58.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.58.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.59.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.59.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.59.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.6.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.6.gate_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.mlp.experts.6.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.60.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.60.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.60.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.61.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.61.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.61.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.62.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.62.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.62.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.63.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.63.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.63.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.64.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.64.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.64.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.65.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.65.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.65.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.66.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.66.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.66.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.67.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.67.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.67.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.68.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.68.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.68.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.69.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.69.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.69.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.7.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.7.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.7.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.70.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.70.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.70.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.71.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.71.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.71.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.72.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.72.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.72.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.73.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.73.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.73.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.74.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.74.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.74.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.75.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.75.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.75.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.76.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.76.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.76.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.77.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.77.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.77.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.78.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.78.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.78.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.79.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.79.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.79.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.8.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.8.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.8.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.80.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.80.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.80.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.81.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.81.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.81.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.82.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.82.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.82.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.83.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.83.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.83.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.84.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.84.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.84.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.85.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.85.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.85.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.86.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.86.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.86.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.87.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.87.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.87.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.88.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.88.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.88.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.89.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.89.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.89.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.9.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.9.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.9.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.90.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.90.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.90.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.91.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.91.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.91.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.92.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.92.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.92.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.93.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.93.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.93.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.94.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.94.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.94.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.95.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.95.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.95.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.96.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.96.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.96.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.97.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.97.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.97.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.98.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.98.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.98.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.99.down_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.99.gate_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.experts.99.up_proj.weight": "model-00046-of-00142.safetensors", + "model.layers.31.mlp.gate.e_score_correction_bias": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.gate.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.shared_experts.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.shared_experts.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.mlp.shared_experts.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00047-of-00142.safetensors", + "model.layers.31.self_attn.k_norm.weight": "model-00045-of-00142.safetensors", + "model.layers.31.self_attn.k_proj.bias": "model-00045-of-00142.safetensors", + "model.layers.31.self_attn.k_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.self_attn.q_norm.weight": "model-00045-of-00142.safetensors", + "model.layers.31.self_attn.q_proj.bias": "model-00045-of-00142.safetensors", + "model.layers.31.self_attn.q_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.31.self_attn.v_proj.bias": "model-00045-of-00142.safetensors", + "model.layers.31.self_attn.v_proj.weight": "model-00045-of-00142.safetensors", + "model.layers.32.input_layernorm.weight": "model-00049-of-00142.safetensors", + "model.layers.32.mlp.experts.0.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.0.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.0.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.1.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.1.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.1.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.10.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.10.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.10.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.100.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.100.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.100.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.101.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.101.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.101.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.102.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.102.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.102.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.103.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.103.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.103.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.104.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.104.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.104.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.105.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.105.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.105.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.106.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.106.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.106.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.107.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.107.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.107.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.108.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.108.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.108.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.109.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.109.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.109.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.11.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.11.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.11.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.110.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.110.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.110.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.111.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.111.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.111.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.112.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.112.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.112.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.113.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.113.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.113.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.114.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.114.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.114.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.115.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.115.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.115.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.116.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.116.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.116.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.117.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.117.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.117.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.118.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.118.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.118.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.119.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.119.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.119.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.12.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.12.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.12.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.120.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.120.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.120.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.121.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.121.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.121.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.122.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.122.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.122.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.123.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.123.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.123.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.124.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.124.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.124.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.125.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.125.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.125.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.126.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.126.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.126.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.127.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.127.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.127.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.128.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.128.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.128.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.129.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.129.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.129.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.13.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.13.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.13.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.130.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.130.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.130.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.131.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.131.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.131.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.132.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.132.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.132.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.133.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.133.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.133.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.134.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.134.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.134.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.135.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.135.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.135.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.136.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.136.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.136.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.137.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.137.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.137.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.138.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.138.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.138.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.139.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.139.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.139.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.14.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.14.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.14.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.140.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.140.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.140.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.141.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.141.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.141.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.142.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.142.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.142.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.143.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.143.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.143.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.144.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.144.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.144.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.145.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.145.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.145.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.146.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.146.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.146.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.147.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.147.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.147.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.148.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.148.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.148.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.149.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.149.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.149.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.15.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.15.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.15.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.150.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.150.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.150.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.151.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.151.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.151.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.152.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.152.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.152.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.153.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.153.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.153.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.154.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.154.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.154.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.155.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.155.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.155.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.156.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.32.mlp.experts.156.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.156.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.157.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.32.mlp.experts.157.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.32.mlp.experts.157.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.32.mlp.experts.158.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.32.mlp.experts.158.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.32.mlp.experts.158.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.32.mlp.experts.159.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.32.mlp.experts.159.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.32.mlp.experts.159.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.32.mlp.experts.16.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.16.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.16.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.17.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.17.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.17.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.18.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.18.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.18.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.19.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.19.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.19.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.2.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.2.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.2.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.20.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.20.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.20.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.21.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.21.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.21.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.22.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.22.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.22.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.23.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.23.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.23.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.24.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.24.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.24.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.25.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.25.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.25.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.26.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.26.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.26.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.27.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.27.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.27.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.28.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.28.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.28.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.29.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.29.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.29.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.3.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.3.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.3.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.30.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.30.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.30.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.31.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.31.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.31.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.32.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.32.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.32.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.33.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.33.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.33.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.34.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.34.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.34.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.35.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.35.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.35.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.36.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.36.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.36.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.37.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.37.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.37.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.38.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.38.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.38.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.39.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.39.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.39.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.4.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.4.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.4.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.40.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.40.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.40.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.41.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.41.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.41.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.42.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.42.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.42.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.43.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.43.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.43.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.44.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.44.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.44.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.45.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.45.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.45.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.46.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.46.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.46.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.47.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.47.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.47.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.48.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.48.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.48.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.49.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.49.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.49.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.5.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.5.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.5.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.50.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.50.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.50.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.51.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.51.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.51.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.52.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.52.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.52.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.53.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.53.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.53.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.54.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.54.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.54.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.55.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.55.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.55.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.56.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.56.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.56.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.57.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.57.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.57.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.58.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.58.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.58.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.59.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.59.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.59.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.6.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.6.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.6.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.60.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.60.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.60.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.61.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.61.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.61.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.62.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.62.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.62.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.63.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.63.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.63.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.64.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.64.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.64.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.65.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.65.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.65.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.66.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.66.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.66.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.67.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.67.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.67.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.68.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.68.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.68.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.69.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.69.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.69.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.7.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.7.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.7.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.70.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.70.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.70.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.71.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.71.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.71.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.72.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.72.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.72.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.73.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.73.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.73.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.74.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.74.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.74.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.75.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.75.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.75.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.76.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.76.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.76.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.77.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.77.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.77.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.78.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.78.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.78.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.79.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.79.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.79.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.8.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.8.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.8.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.80.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.80.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.80.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.81.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.81.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.81.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.82.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.82.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.82.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.83.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.83.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.83.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.84.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.84.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.84.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.85.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.85.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.85.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.86.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.86.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.86.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.87.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.87.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.87.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.88.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.88.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.88.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.89.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.89.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.89.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.9.down_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.9.gate_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.9.up_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.mlp.experts.90.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.90.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.90.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.91.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.91.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.91.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.92.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.92.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.92.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.93.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.93.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.93.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.94.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.94.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.94.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.95.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.95.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.95.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.96.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.96.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.96.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.97.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.97.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.97.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.98.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.98.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.98.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.99.down_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.99.gate_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.experts.99.up_proj.weight": "model-00048-of-00142.safetensors", + "model.layers.32.mlp.gate.e_score_correction_bias": "model-00049-of-00142.safetensors", + "model.layers.32.mlp.gate.weight": "model-00049-of-00142.safetensors", + "model.layers.32.mlp.shared_experts.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.32.mlp.shared_experts.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.32.mlp.shared_experts.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.32.post_attention_layernorm.weight": "model-00049-of-00142.safetensors", + "model.layers.32.self_attn.k_norm.weight": "model-00047-of-00142.safetensors", + "model.layers.32.self_attn.k_proj.bias": "model-00047-of-00142.safetensors", + "model.layers.32.self_attn.k_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.self_attn.o_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.self_attn.q_norm.weight": "model-00047-of-00142.safetensors", + "model.layers.32.self_attn.q_proj.bias": "model-00047-of-00142.safetensors", + "model.layers.32.self_attn.q_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.32.self_attn.v_proj.bias": "model-00047-of-00142.safetensors", + "model.layers.32.self_attn.v_proj.weight": "model-00047-of-00142.safetensors", + "model.layers.33.input_layernorm.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.0.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.0.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.0.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.1.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.1.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.1.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.10.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.10.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.10.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.100.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.100.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.100.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.101.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.101.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.101.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.102.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.102.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.102.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.103.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.103.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.103.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.104.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.104.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.104.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.105.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.105.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.105.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.106.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.106.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.106.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.107.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.107.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.107.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.108.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.108.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.108.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.109.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.109.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.109.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.11.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.11.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.11.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.110.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.110.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.110.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.111.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.111.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.111.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.112.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.112.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.112.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.113.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.113.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.113.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.114.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.114.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.114.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.115.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.115.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.115.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.116.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.116.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.116.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.117.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.117.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.117.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.118.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.118.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.118.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.119.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.119.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.119.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.12.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.12.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.12.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.120.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.120.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.120.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.121.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.121.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.121.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.122.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.122.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.122.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.123.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.123.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.123.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.124.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.124.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.124.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.125.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.125.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.125.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.126.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.126.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.126.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.127.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.127.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.127.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.128.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.128.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.128.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.129.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.129.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.129.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.13.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.13.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.13.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.130.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.130.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.130.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.131.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.131.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.131.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.132.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.132.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.132.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.133.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.133.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.133.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.134.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.134.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.134.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.135.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.135.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.135.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.136.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.136.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.136.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.137.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.137.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.137.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.138.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.138.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.138.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.139.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.139.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.139.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.14.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.14.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.14.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.140.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.140.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.140.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.141.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.141.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.141.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.142.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.142.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.142.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.143.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.143.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.143.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.144.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.144.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.144.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.145.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.145.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.145.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.146.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.146.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.146.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.147.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.147.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.147.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.148.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.148.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.148.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.149.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.149.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.149.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.15.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.15.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.15.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.150.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.150.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.150.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.151.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.151.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.151.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.152.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.152.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.152.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.153.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.153.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.153.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.154.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.154.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.154.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.155.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.155.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.155.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.156.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.156.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.156.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.157.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.157.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.157.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.158.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.158.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.158.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.159.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.159.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.159.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.16.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.16.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.16.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.17.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.17.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.17.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.18.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.18.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.18.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.19.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.19.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.19.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.2.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.2.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.2.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.20.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.20.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.20.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.21.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.21.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.21.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.22.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.22.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.22.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.23.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.23.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.23.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.24.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.24.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.24.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.25.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.25.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.25.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.26.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.26.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.26.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.27.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.27.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.27.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.28.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.28.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.28.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.29.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.29.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.29.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.3.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.3.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.3.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.30.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.30.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.30.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.31.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.31.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.31.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.32.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.32.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.32.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.33.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.33.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.33.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.34.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.34.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.34.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.35.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.35.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.35.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.36.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.36.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.36.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.37.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.37.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.37.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.38.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.38.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.38.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.39.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.39.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.39.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.4.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.4.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.4.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.40.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.40.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.40.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.41.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.41.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.41.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.42.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.42.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.42.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.43.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.43.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.43.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.44.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.44.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.44.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.45.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.45.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.45.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.46.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.46.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.46.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.47.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.47.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.47.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.48.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.48.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.48.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.49.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.49.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.49.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.5.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.5.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.5.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.50.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.50.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.50.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.51.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.51.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.51.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.52.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.52.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.52.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.53.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.53.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.53.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.54.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.54.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.54.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.55.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.55.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.55.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.56.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.56.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.56.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.57.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.57.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.57.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.58.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.58.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.58.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.59.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.59.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.59.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.6.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.6.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.6.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.60.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.60.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.60.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.61.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.61.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.61.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.62.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.62.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.62.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.63.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.63.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.63.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.64.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.64.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.64.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.65.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.65.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.65.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.66.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.66.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.66.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.67.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.67.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.67.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.68.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.68.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.68.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.69.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.69.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.69.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.7.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.7.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.7.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.70.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.70.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.70.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.71.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.71.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.71.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.72.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.72.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.72.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.73.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.73.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.73.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.74.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.74.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.74.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.75.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.75.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.75.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.76.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.76.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.76.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.77.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.77.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.77.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.78.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.78.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.78.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.79.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.79.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.79.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.8.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.8.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.8.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.80.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.80.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.80.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.81.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.81.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.81.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.82.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.82.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.82.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.83.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.83.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.83.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.84.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.84.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.84.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.85.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.85.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.85.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.86.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.86.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.86.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.87.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.87.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.87.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.88.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.88.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.88.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.89.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.89.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.89.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.9.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.9.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.9.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.90.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.90.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.90.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.91.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.91.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.91.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.92.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.92.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.92.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.93.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.93.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.93.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.94.down_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.94.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.94.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.95.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.95.gate_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.95.up_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.mlp.experts.96.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.96.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.96.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.97.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.97.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.97.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.98.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.98.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.98.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.99.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.99.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.experts.99.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.gate.e_score_correction_bias": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.gate.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.shared_experts.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.shared_experts.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.mlp.shared_experts.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.33.post_attention_layernorm.weight": "model-00050-of-00142.safetensors", + "model.layers.33.self_attn.k_norm.weight": "model-00049-of-00142.safetensors", + "model.layers.33.self_attn.k_proj.bias": "model-00049-of-00142.safetensors", + "model.layers.33.self_attn.k_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.self_attn.o_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.self_attn.q_norm.weight": "model-00049-of-00142.safetensors", + "model.layers.33.self_attn.q_proj.bias": "model-00049-of-00142.safetensors", + "model.layers.33.self_attn.q_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.33.self_attn.v_proj.bias": "model-00049-of-00142.safetensors", + "model.layers.33.self_attn.v_proj.weight": "model-00049-of-00142.safetensors", + "model.layers.34.input_layernorm.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.0.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.0.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.0.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.1.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.1.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.1.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.10.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.10.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.10.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.100.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.100.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.100.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.101.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.101.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.101.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.102.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.102.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.102.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.103.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.103.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.103.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.104.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.104.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.104.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.105.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.105.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.105.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.106.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.106.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.106.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.107.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.107.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.107.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.108.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.108.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.108.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.109.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.109.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.109.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.11.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.11.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.11.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.110.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.110.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.110.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.111.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.111.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.111.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.112.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.112.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.112.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.113.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.113.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.113.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.114.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.114.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.114.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.115.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.115.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.115.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.116.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.116.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.116.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.117.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.117.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.117.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.118.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.118.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.118.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.119.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.119.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.119.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.12.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.12.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.12.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.120.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.120.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.120.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.121.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.121.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.121.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.122.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.122.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.122.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.123.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.123.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.123.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.124.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.124.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.124.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.125.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.125.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.125.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.126.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.126.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.126.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.127.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.127.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.127.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.128.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.128.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.128.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.129.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.129.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.129.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.13.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.13.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.13.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.130.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.130.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.130.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.131.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.131.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.131.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.132.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.132.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.132.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.133.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.133.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.133.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.134.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.134.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.134.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.135.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.135.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.135.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.136.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.136.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.136.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.137.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.137.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.137.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.138.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.138.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.138.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.139.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.139.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.139.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.14.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.14.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.14.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.140.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.140.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.140.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.141.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.141.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.141.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.142.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.142.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.142.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.143.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.143.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.143.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.144.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.144.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.144.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.145.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.145.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.145.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.146.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.146.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.146.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.147.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.147.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.147.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.148.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.148.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.148.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.149.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.149.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.149.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.15.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.15.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.15.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.150.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.150.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.150.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.151.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.151.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.151.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.152.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.152.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.152.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.153.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.153.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.153.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.154.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.154.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.154.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.155.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.155.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.155.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.156.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.156.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.156.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.157.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.157.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.157.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.158.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.158.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.158.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.159.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.159.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.159.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.experts.16.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.16.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.16.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.17.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.17.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.17.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.18.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.18.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.18.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.19.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.19.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.19.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.2.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.2.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.2.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.20.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.20.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.20.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.21.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.21.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.21.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.22.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.22.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.22.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.23.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.23.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.23.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.24.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.24.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.24.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.25.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.25.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.25.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.26.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.26.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.26.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.27.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.27.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.27.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.28.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.28.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.28.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.29.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.29.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.29.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.3.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.3.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.3.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.30.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.30.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.30.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.31.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.31.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.31.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.32.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.32.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.32.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.33.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.33.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.33.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.34.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.34.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.34.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.35.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.35.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.35.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.36.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.36.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.36.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.37.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.37.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.37.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.38.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.38.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.38.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.39.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.39.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.39.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.4.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.4.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.4.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.40.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.40.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.40.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.41.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.41.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.41.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.42.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.42.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.42.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.43.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.43.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.43.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.44.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.44.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.44.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.45.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.45.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.45.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.46.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.46.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.46.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.47.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.47.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.47.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.48.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.48.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.48.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.49.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.49.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.49.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.5.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.5.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.5.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.50.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.50.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.50.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.51.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.51.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.51.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.52.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.52.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.52.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.53.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.53.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.53.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.54.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.54.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.54.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.55.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.55.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.55.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.56.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.56.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.56.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.57.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.57.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.57.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.58.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.58.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.58.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.59.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.59.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.59.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.6.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.6.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.6.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.60.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.60.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.60.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.61.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.61.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.61.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.62.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.62.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.62.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.63.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.63.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.63.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.64.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.64.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.64.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.65.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.65.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.65.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.66.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.66.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.66.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.67.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.67.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.67.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.68.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.68.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.68.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.69.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.69.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.69.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.7.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.7.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.7.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.70.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.70.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.70.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.71.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.71.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.71.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.72.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.72.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.72.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.73.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.73.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.73.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.74.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.74.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.74.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.75.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.75.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.75.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.76.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.76.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.76.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.77.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.77.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.77.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.78.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.78.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.78.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.79.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.79.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.79.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.8.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.8.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.8.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.80.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.80.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.80.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.81.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.81.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.81.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.82.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.82.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.82.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.83.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.83.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.83.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.84.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.84.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.84.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.85.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.85.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.85.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.86.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.86.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.86.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.87.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.87.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.87.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.88.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.88.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.88.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.89.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.89.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.89.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.9.down_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.9.gate_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.9.up_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.mlp.experts.90.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.90.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.90.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.91.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.91.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.91.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.92.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.92.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.92.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.93.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.93.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.93.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.94.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.94.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.94.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.95.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.95.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.95.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.96.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.96.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.96.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.97.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.97.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.97.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.98.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.98.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.98.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.99.down_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.99.gate_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.experts.99.up_proj.weight": "model-00051-of-00142.safetensors", + "model.layers.34.mlp.gate.e_score_correction_bias": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.gate.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.shared_experts.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.shared_experts.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.mlp.shared_experts.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.34.post_attention_layernorm.weight": "model-00052-of-00142.safetensors", + "model.layers.34.self_attn.k_norm.weight": "model-00050-of-00142.safetensors", + "model.layers.34.self_attn.k_proj.bias": "model-00050-of-00142.safetensors", + "model.layers.34.self_attn.k_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.self_attn.o_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.self_attn.q_norm.weight": "model-00050-of-00142.safetensors", + "model.layers.34.self_attn.q_proj.bias": "model-00050-of-00142.safetensors", + "model.layers.34.self_attn.q_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.34.self_attn.v_proj.bias": "model-00050-of-00142.safetensors", + "model.layers.34.self_attn.v_proj.weight": "model-00050-of-00142.safetensors", + "model.layers.35.input_layernorm.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.0.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.0.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.0.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.1.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.1.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.1.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.10.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.10.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.10.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.100.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.100.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.100.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.101.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.101.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.101.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.102.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.102.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.102.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.103.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.103.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.103.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.104.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.104.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.104.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.105.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.105.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.105.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.106.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.106.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.106.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.107.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.107.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.107.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.108.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.108.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.108.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.109.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.109.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.109.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.11.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.11.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.11.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.110.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.110.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.110.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.111.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.111.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.111.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.112.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.112.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.112.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.113.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.113.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.113.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.114.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.114.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.114.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.115.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.115.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.115.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.116.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.116.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.116.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.117.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.117.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.117.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.118.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.118.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.118.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.119.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.119.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.119.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.12.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.12.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.12.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.120.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.120.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.120.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.121.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.121.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.121.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.122.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.122.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.122.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.123.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.123.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.123.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.124.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.124.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.124.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.125.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.125.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.125.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.126.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.126.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.126.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.127.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.127.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.127.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.128.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.128.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.128.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.129.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.129.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.129.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.13.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.13.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.13.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.130.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.130.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.130.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.131.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.131.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.131.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.132.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.132.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.132.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.133.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.133.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.133.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.134.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.134.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.134.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.135.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.135.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.135.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.136.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.136.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.136.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.137.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.137.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.137.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.138.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.138.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.138.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.139.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.139.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.139.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.14.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.14.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.14.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.140.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.140.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.140.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.141.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.141.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.141.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.142.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.142.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.142.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.143.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.143.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.143.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.144.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.144.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.144.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.145.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.145.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.145.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.146.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.146.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.146.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.147.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.147.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.147.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.148.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.148.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.148.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.149.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.149.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.149.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.15.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.15.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.15.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.150.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.150.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.150.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.151.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.151.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.151.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.152.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.152.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.152.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.153.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.153.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.153.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.154.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.154.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.154.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.155.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.155.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.155.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.156.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.156.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.156.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.157.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.157.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.157.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.158.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.158.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.158.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.159.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.159.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.159.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.16.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.16.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.16.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.17.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.17.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.17.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.18.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.18.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.18.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.19.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.19.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.19.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.2.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.2.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.2.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.20.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.20.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.20.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.21.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.21.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.21.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.22.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.22.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.22.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.23.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.23.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.23.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.24.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.24.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.24.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.25.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.25.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.25.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.26.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.26.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.26.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.27.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.27.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.27.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.28.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.28.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.28.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.29.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.29.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.29.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.3.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.3.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.3.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.30.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.30.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.30.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.31.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.31.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.31.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.32.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.32.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.32.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.33.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.33.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.33.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.34.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.34.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.34.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.35.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.35.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.35.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.36.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.36.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.36.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.37.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.37.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.37.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.38.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.38.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.38.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.39.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.39.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.39.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.4.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.4.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.4.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.40.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.40.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.40.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.41.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.41.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.41.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.42.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.42.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.42.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.43.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.43.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.43.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.44.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.44.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.44.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.45.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.45.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.45.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.46.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.46.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.46.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.47.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.47.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.47.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.48.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.48.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.48.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.49.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.49.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.49.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.5.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.5.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.5.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.50.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.50.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.50.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.51.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.51.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.51.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.52.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.52.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.52.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.53.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.53.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.53.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.54.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.54.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.54.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.55.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.55.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.55.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.56.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.56.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.56.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.57.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.57.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.57.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.58.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.58.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.58.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.59.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.59.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.59.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.6.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.6.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.6.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.60.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.60.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.60.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.61.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.61.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.61.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.62.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.62.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.62.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.63.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.63.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.63.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.64.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.64.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.64.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.65.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.65.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.65.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.66.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.66.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.66.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.67.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.67.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.67.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.68.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.68.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.68.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.69.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.69.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.69.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.7.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.7.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.7.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.70.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.70.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.70.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.71.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.71.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.71.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.72.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.72.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.72.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.73.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.73.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.73.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.74.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.74.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.74.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.75.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.75.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.75.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.76.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.76.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.76.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.77.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.77.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.77.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.78.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.78.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.78.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.79.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.79.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.79.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.8.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.8.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.8.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.80.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.80.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.80.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.81.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.81.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.81.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.82.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.82.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.82.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.83.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.83.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.83.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.84.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.84.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.84.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.85.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.85.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.85.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.86.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.86.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.86.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.87.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.87.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.87.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.88.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.88.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.88.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.89.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.89.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.89.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.9.down_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.9.gate_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.9.up_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.mlp.experts.90.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.90.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.90.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.91.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.91.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.91.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.92.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.92.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.92.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.93.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.93.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.93.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.94.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.94.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.94.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.95.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.95.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.95.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.96.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.96.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.96.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.97.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.97.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.97.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.98.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.98.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.98.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.99.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.99.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.experts.99.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.gate.e_score_correction_bias": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.gate.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.shared_experts.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.shared_experts.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.mlp.shared_experts.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.35.post_attention_layernorm.weight": "model-00053-of-00142.safetensors", + "model.layers.35.self_attn.k_norm.weight": "model-00052-of-00142.safetensors", + "model.layers.35.self_attn.k_proj.bias": "model-00052-of-00142.safetensors", + "model.layers.35.self_attn.k_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.self_attn.o_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.self_attn.q_norm.weight": "model-00052-of-00142.safetensors", + "model.layers.35.self_attn.q_proj.bias": "model-00052-of-00142.safetensors", + "model.layers.35.self_attn.q_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.35.self_attn.v_proj.bias": "model-00052-of-00142.safetensors", + "model.layers.35.self_attn.v_proj.weight": "model-00052-of-00142.safetensors", + "model.layers.36.input_layernorm.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.0.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.0.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.0.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.1.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.1.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.1.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.10.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.10.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.10.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.100.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.100.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.100.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.101.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.101.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.101.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.102.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.102.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.102.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.103.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.103.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.103.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.104.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.104.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.104.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.105.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.105.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.105.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.106.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.106.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.106.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.107.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.107.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.107.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.108.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.108.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.108.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.109.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.109.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.109.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.11.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.11.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.11.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.110.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.110.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.110.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.111.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.111.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.111.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.112.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.112.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.112.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.113.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.113.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.113.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.114.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.114.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.114.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.115.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.115.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.115.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.116.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.116.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.116.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.117.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.117.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.117.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.118.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.118.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.118.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.119.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.119.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.119.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.12.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.12.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.12.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.120.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.120.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.120.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.121.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.121.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.121.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.122.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.122.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.122.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.123.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.123.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.123.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.124.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.124.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.124.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.125.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.125.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.125.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.126.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.126.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.126.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.127.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.127.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.127.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.128.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.128.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.128.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.129.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.129.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.129.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.13.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.13.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.13.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.130.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.130.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.130.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.131.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.131.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.131.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.132.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.132.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.132.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.133.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.133.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.133.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.134.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.134.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.134.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.135.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.135.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.135.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.136.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.136.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.136.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.137.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.137.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.137.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.138.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.138.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.138.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.139.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.139.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.139.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.14.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.14.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.14.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.140.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.140.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.140.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.141.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.141.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.141.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.142.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.142.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.142.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.143.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.143.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.143.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.144.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.144.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.144.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.145.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.145.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.145.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.146.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.146.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.146.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.147.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.147.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.147.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.148.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.148.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.148.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.149.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.149.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.149.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.15.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.15.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.15.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.150.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.150.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.150.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.151.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.151.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.151.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.152.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.152.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.152.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.153.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.153.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.153.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.154.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.154.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.154.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.155.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.155.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.155.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.156.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.156.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.156.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.157.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.157.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.157.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.158.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.158.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.158.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.159.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.159.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.159.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.experts.16.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.16.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.16.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.17.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.17.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.17.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.18.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.18.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.18.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.19.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.19.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.19.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.2.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.2.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.2.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.20.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.20.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.20.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.21.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.21.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.21.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.22.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.22.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.22.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.23.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.23.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.23.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.24.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.24.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.24.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.25.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.25.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.25.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.26.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.26.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.26.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.27.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.27.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.27.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.28.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.28.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.28.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.29.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.29.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.29.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.3.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.3.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.3.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.30.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.30.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.30.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.31.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.31.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.31.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.32.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.32.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.32.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.33.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.33.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.33.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.34.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.34.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.34.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.35.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.35.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.35.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.36.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.36.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.36.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.37.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.37.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.37.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.38.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.38.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.38.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.39.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.39.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.39.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.4.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.4.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.4.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.40.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.40.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.40.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.41.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.41.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.41.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.42.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.42.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.42.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.43.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.43.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.43.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.44.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.44.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.44.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.45.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.45.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.45.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.46.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.46.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.46.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.47.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.47.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.47.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.48.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.48.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.48.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.49.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.49.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.49.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.5.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.5.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.5.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.50.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.50.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.50.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.51.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.51.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.51.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.52.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.52.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.52.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.53.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.53.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.53.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.54.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.54.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.54.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.55.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.55.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.55.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.56.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.56.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.56.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.57.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.57.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.57.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.58.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.58.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.58.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.59.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.59.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.59.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.6.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.6.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.6.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.60.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.60.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.60.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.61.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.61.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.61.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.62.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.62.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.62.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.63.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.63.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.63.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.64.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.64.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.64.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.65.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.65.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.65.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.66.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.66.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.66.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.67.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.67.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.67.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.68.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.68.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.68.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.69.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.69.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.69.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.7.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.7.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.7.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.70.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.70.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.70.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.71.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.71.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.71.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.72.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.72.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.72.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.73.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.73.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.73.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.74.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.74.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.74.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.75.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.75.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.75.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.76.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.76.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.76.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.77.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.77.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.77.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.78.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.78.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.78.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.79.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.79.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.79.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.8.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.8.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.8.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.80.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.80.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.80.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.81.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.81.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.81.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.82.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.82.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.82.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.83.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.83.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.83.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.84.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.84.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.84.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.85.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.85.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.85.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.86.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.86.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.86.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.87.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.87.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.87.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.88.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.88.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.88.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.89.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.89.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.89.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.9.down_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.9.gate_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.9.up_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.mlp.experts.90.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.90.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.90.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.91.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.91.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.91.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.92.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.92.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.92.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.93.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.93.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.93.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.94.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.94.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.94.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.95.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.95.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.95.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.96.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.96.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.96.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.97.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.97.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.97.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.98.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.98.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.98.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.99.down_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.99.gate_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.experts.99.up_proj.weight": "model-00054-of-00142.safetensors", + "model.layers.36.mlp.gate.e_score_correction_bias": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.gate.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.shared_experts.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.shared_experts.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.mlp.shared_experts.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.36.post_attention_layernorm.weight": "model-00055-of-00142.safetensors", + "model.layers.36.self_attn.k_norm.weight": "model-00053-of-00142.safetensors", + "model.layers.36.self_attn.k_proj.bias": "model-00053-of-00142.safetensors", + "model.layers.36.self_attn.k_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.self_attn.o_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.self_attn.q_norm.weight": "model-00053-of-00142.safetensors", + "model.layers.36.self_attn.q_proj.bias": "model-00053-of-00142.safetensors", + "model.layers.36.self_attn.q_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.36.self_attn.v_proj.bias": "model-00053-of-00142.safetensors", + "model.layers.36.self_attn.v_proj.weight": "model-00053-of-00142.safetensors", + "model.layers.37.input_layernorm.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.0.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.0.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.0.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.1.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.1.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.1.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.10.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.10.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.10.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.100.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.100.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.100.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.101.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.101.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.101.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.102.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.102.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.102.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.103.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.103.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.103.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.104.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.104.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.104.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.105.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.105.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.105.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.106.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.106.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.106.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.107.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.107.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.107.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.108.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.108.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.108.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.109.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.109.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.109.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.11.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.11.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.11.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.110.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.110.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.110.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.111.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.111.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.111.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.112.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.112.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.112.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.113.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.113.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.113.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.114.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.114.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.114.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.115.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.115.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.115.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.116.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.116.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.116.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.117.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.117.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.117.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.118.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.118.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.118.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.119.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.119.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.119.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.12.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.12.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.12.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.120.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.120.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.120.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.121.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.121.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.121.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.122.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.122.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.122.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.123.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.123.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.123.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.124.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.124.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.124.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.125.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.125.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.125.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.126.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.126.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.126.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.127.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.127.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.127.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.128.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.128.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.128.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.129.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.129.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.129.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.13.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.13.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.13.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.130.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.130.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.130.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.131.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.131.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.131.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.132.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.132.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.132.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.133.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.133.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.133.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.134.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.134.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.134.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.135.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.135.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.135.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.136.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.136.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.136.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.137.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.137.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.137.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.138.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.138.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.138.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.139.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.139.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.139.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.14.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.14.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.14.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.140.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.140.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.140.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.141.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.141.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.141.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.142.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.142.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.142.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.143.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.143.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.143.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.144.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.144.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.144.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.145.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.145.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.145.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.146.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.146.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.146.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.147.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.147.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.147.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.148.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.148.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.148.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.149.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.149.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.149.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.15.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.15.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.15.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.150.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.150.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.150.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.151.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.151.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.151.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.152.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.152.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.152.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.153.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.153.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.153.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.154.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.154.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.154.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.155.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.155.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.155.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.156.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.156.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.156.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.157.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.157.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.157.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.158.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.158.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.158.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.159.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.159.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.159.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.16.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.16.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.16.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.17.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.17.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.17.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.18.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.18.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.18.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.19.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.19.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.19.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.2.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.2.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.2.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.20.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.20.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.20.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.21.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.21.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.21.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.22.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.22.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.22.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.23.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.23.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.23.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.24.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.24.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.24.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.25.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.25.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.25.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.26.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.26.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.26.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.27.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.27.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.27.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.28.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.28.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.28.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.29.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.29.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.29.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.3.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.3.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.3.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.30.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.30.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.30.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.31.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.31.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.31.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.32.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.32.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.32.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.33.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.33.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.33.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.34.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.34.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.34.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.35.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.35.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.35.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.36.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.36.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.36.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.37.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.37.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.37.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.38.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.38.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.38.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.39.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.39.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.39.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.4.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.4.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.4.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.40.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.40.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.40.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.41.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.41.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.41.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.42.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.42.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.42.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.43.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.43.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.43.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.44.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.44.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.44.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.45.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.45.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.45.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.46.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.46.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.46.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.47.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.47.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.47.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.48.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.48.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.48.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.49.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.49.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.49.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.5.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.5.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.5.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.50.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.50.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.50.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.51.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.51.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.51.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.52.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.52.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.52.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.53.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.53.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.53.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.54.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.54.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.54.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.55.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.55.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.55.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.56.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.56.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.56.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.57.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.57.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.57.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.58.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.58.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.58.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.59.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.59.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.59.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.6.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.6.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.6.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.60.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.60.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.60.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.61.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.61.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.61.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.62.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.62.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.62.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.63.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.63.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.63.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.64.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.64.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.64.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.65.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.65.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.65.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.66.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.66.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.66.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.67.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.67.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.67.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.68.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.68.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.68.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.69.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.69.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.69.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.7.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.7.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.7.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.70.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.70.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.70.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.71.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.71.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.71.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.72.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.72.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.72.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.73.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.73.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.73.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.74.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.74.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.74.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.75.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.75.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.75.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.76.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.76.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.76.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.77.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.77.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.77.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.78.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.78.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.78.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.79.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.79.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.79.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.8.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.8.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.8.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.80.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.80.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.80.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.81.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.81.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.81.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.82.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.82.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.82.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.83.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.83.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.83.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.84.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.84.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.84.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.85.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.85.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.85.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.86.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.86.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.86.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.87.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.87.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.87.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.88.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.88.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.88.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.89.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.89.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.89.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.9.down_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.9.gate_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.9.up_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.mlp.experts.90.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.90.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.90.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.91.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.91.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.91.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.92.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.92.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.92.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.93.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.93.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.93.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.94.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.94.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.94.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.95.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.95.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.95.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.96.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.96.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.96.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.97.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.97.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.97.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.98.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.98.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.98.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.99.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.99.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.experts.99.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.gate.e_score_correction_bias": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.gate.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.shared_experts.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.shared_experts.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.mlp.shared_experts.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.37.post_attention_layernorm.weight": "model-00056-of-00142.safetensors", + "model.layers.37.self_attn.k_norm.weight": "model-00055-of-00142.safetensors", + "model.layers.37.self_attn.k_proj.bias": "model-00055-of-00142.safetensors", + "model.layers.37.self_attn.k_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.self_attn.o_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.self_attn.q_norm.weight": "model-00055-of-00142.safetensors", + "model.layers.37.self_attn.q_proj.bias": "model-00055-of-00142.safetensors", + "model.layers.37.self_attn.q_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.37.self_attn.v_proj.bias": "model-00055-of-00142.safetensors", + "model.layers.37.self_attn.v_proj.weight": "model-00055-of-00142.safetensors", + "model.layers.38.input_layernorm.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.0.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.38.mlp.experts.0.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.38.mlp.experts.0.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.38.mlp.experts.1.down_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.38.mlp.experts.1.gate_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.38.mlp.experts.1.up_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.38.mlp.experts.10.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.10.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.10.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.100.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.100.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.100.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.101.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.101.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.101.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.102.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.102.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.102.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.103.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.103.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.103.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.104.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.104.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.104.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.105.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.105.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.105.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.106.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.106.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.106.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.107.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.107.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.107.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.108.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.108.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.108.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.109.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.109.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.109.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.11.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.11.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.11.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.110.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.110.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.110.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.111.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.111.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.111.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.112.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.112.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.112.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.113.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.113.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.113.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.114.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.114.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.114.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.115.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.115.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.115.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.116.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.116.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.116.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.117.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.117.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.117.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.118.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.118.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.118.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.119.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.119.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.119.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.12.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.12.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.12.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.120.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.120.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.120.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.121.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.121.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.121.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.122.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.122.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.122.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.123.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.123.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.123.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.124.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.124.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.124.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.125.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.125.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.125.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.126.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.126.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.126.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.127.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.127.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.127.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.128.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.128.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.128.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.129.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.129.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.129.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.13.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.13.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.13.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.130.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.130.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.130.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.131.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.131.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.131.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.132.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.132.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.132.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.133.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.133.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.133.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.134.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.134.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.134.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.135.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.135.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.135.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.136.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.136.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.136.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.137.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.137.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.137.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.138.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.138.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.138.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.139.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.139.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.139.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.14.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.14.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.14.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.140.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.140.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.140.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.141.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.141.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.141.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.142.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.142.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.142.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.143.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.143.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.143.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.144.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.144.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.144.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.145.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.145.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.145.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.146.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.146.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.146.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.147.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.147.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.147.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.148.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.148.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.148.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.149.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.149.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.149.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.15.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.15.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.15.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.150.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.150.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.150.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.151.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.151.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.151.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.152.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.152.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.152.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.153.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.153.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.153.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.154.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.154.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.154.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.155.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.155.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.155.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.156.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.156.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.156.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.157.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.157.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.157.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.158.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.158.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.158.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.159.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.159.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.159.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.experts.16.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.16.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.16.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.17.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.17.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.17.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.18.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.18.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.18.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.19.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.19.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.19.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.2.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.2.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.2.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.20.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.20.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.20.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.21.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.21.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.21.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.22.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.22.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.22.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.23.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.23.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.23.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.24.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.24.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.24.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.25.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.25.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.25.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.26.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.26.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.26.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.27.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.27.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.27.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.28.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.28.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.28.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.29.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.29.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.29.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.3.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.3.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.3.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.30.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.30.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.30.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.31.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.31.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.31.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.32.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.32.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.32.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.33.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.33.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.33.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.34.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.34.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.34.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.35.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.35.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.35.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.36.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.36.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.36.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.37.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.37.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.37.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.38.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.38.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.38.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.39.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.39.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.39.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.4.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.4.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.4.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.40.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.40.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.40.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.41.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.41.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.41.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.42.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.42.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.42.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.43.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.43.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.43.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.44.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.44.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.44.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.45.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.45.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.45.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.46.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.46.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.46.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.47.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.47.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.47.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.48.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.48.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.48.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.49.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.49.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.49.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.5.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.5.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.5.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.50.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.50.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.50.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.51.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.51.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.51.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.52.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.52.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.52.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.53.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.53.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.53.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.54.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.54.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.54.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.55.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.55.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.55.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.56.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.56.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.56.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.57.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.57.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.57.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.58.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.58.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.58.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.59.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.59.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.59.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.6.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.6.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.6.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.60.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.60.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.60.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.61.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.61.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.61.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.62.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.62.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.62.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.63.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.63.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.63.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.64.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.64.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.64.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.65.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.65.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.65.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.66.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.66.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.66.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.67.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.67.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.67.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.68.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.68.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.68.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.69.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.69.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.69.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.7.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.7.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.7.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.70.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.70.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.70.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.71.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.71.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.71.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.72.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.72.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.72.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.73.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.73.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.73.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.74.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.74.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.74.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.75.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.75.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.75.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.76.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.76.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.76.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.77.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.77.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.77.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.78.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.78.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.78.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.79.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.79.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.79.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.8.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.8.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.8.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.80.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.80.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.80.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.81.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.81.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.81.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.82.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.82.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.82.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.83.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.83.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.83.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.84.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.84.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.84.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.85.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.85.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.85.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.86.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.86.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.86.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.87.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.87.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.87.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.88.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.88.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.88.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.89.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.89.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.89.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.9.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.9.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.9.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.90.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.90.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.90.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.91.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.91.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.91.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.92.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.92.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.92.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.93.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.93.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.93.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.94.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.94.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.94.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.95.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.95.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.95.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.96.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.96.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.96.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.97.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.97.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.97.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.98.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.98.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.98.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.99.down_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.99.gate_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.experts.99.up_proj.weight": "model-00057-of-00142.safetensors", + "model.layers.38.mlp.gate.e_score_correction_bias": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.gate.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.shared_experts.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.shared_experts.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.mlp.shared_experts.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.38.post_attention_layernorm.weight": "model-00058-of-00142.safetensors", + "model.layers.38.self_attn.k_norm.weight": "model-00056-of-00142.safetensors", + "model.layers.38.self_attn.k_proj.bias": "model-00056-of-00142.safetensors", + "model.layers.38.self_attn.k_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.38.self_attn.o_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.38.self_attn.q_norm.weight": "model-00056-of-00142.safetensors", + "model.layers.38.self_attn.q_proj.bias": "model-00056-of-00142.safetensors", + "model.layers.38.self_attn.q_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.38.self_attn.v_proj.bias": "model-00056-of-00142.safetensors", + "model.layers.38.self_attn.v_proj.weight": "model-00056-of-00142.safetensors", + "model.layers.39.input_layernorm.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.0.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.0.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.0.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.1.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.1.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.1.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.10.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.10.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.10.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.100.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.100.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.100.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.101.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.101.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.101.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.102.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.102.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.102.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.103.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.103.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.103.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.104.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.104.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.104.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.105.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.105.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.105.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.106.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.106.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.106.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.107.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.107.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.107.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.108.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.108.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.108.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.109.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.109.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.109.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.11.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.11.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.11.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.110.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.110.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.110.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.111.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.111.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.111.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.112.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.112.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.112.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.113.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.113.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.113.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.114.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.114.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.114.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.115.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.115.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.115.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.116.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.116.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.116.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.117.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.117.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.117.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.118.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.118.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.118.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.119.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.119.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.119.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.12.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.12.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.12.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.120.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.120.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.120.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.121.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.121.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.121.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.122.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.122.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.122.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.123.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.123.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.123.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.124.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.124.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.124.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.125.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.125.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.125.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.126.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.126.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.126.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.127.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.127.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.127.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.128.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.128.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.128.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.129.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.129.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.129.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.13.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.13.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.13.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.130.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.130.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.130.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.131.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.131.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.131.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.132.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.132.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.132.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.133.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.133.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.133.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.134.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.134.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.134.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.135.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.135.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.135.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.136.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.136.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.136.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.137.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.137.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.137.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.138.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.138.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.138.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.139.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.139.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.139.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.14.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.14.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.14.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.140.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.140.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.140.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.141.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.141.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.141.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.142.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.142.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.142.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.143.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.143.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.143.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.144.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.144.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.144.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.145.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.145.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.145.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.146.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.146.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.146.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.147.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.147.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.147.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.148.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.148.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.148.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.149.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.149.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.149.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.15.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.15.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.15.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.150.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.150.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.150.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.151.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.151.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.151.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.152.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.152.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.152.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.153.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.153.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.153.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.154.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.154.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.154.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.155.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.155.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.155.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.156.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.156.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.156.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.157.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.157.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.157.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.158.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.158.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.158.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.159.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.159.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.159.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.experts.16.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.16.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.16.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.17.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.17.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.17.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.18.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.18.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.18.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.19.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.19.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.19.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.2.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.2.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.2.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.20.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.20.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.20.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.21.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.21.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.21.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.22.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.22.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.22.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.23.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.23.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.23.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.24.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.24.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.24.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.25.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.25.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.25.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.26.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.26.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.26.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.27.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.27.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.27.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.28.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.28.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.28.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.29.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.29.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.29.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.3.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.3.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.3.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.30.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.30.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.30.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.31.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.31.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.31.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.32.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.32.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.32.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.33.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.33.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.33.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.34.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.34.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.34.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.35.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.35.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.35.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.36.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.36.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.36.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.37.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.37.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.37.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.38.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.38.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.38.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.39.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.39.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.39.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.4.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.4.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.4.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.40.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.40.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.40.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.41.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.41.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.41.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.42.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.42.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.42.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.43.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.43.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.43.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.44.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.44.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.44.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.45.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.45.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.45.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.46.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.46.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.46.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.47.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.47.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.47.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.48.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.48.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.48.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.49.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.49.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.49.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.5.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.5.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.5.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.50.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.50.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.50.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.51.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.51.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.51.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.52.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.52.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.52.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.53.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.53.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.53.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.54.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.54.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.54.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.55.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.55.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.55.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.56.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.56.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.56.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.57.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.57.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.57.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.58.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.58.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.58.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.59.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.59.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.59.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.6.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.6.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.6.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.60.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.60.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.60.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.61.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.61.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.61.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.62.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.62.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.62.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.63.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.63.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.63.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.64.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.64.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.64.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.65.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.65.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.65.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.66.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.66.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.66.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.67.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.67.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.67.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.68.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.68.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.68.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.69.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.69.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.69.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.7.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.7.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.7.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.70.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.70.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.70.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.71.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.71.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.71.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.72.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.72.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.72.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.73.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.73.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.73.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.74.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.74.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.74.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.75.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.75.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.75.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.76.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.76.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.76.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.77.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.77.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.77.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.78.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.78.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.78.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.79.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.79.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.79.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.8.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.8.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.8.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.80.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.80.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.80.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.81.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.81.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.81.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.82.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.82.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.82.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.83.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.83.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.83.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.84.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.84.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.84.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.85.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.85.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.85.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.86.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.86.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.86.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.87.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.87.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.87.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.88.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.88.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.88.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.89.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.89.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.89.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.9.down_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.9.gate_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.9.up_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.mlp.experts.90.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.90.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.90.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.91.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.91.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.91.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.92.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.92.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.92.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.93.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.93.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.93.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.94.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.94.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.94.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.95.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.95.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.95.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.96.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.96.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.96.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.97.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.97.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.97.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.98.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.98.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.98.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.99.down_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.99.gate_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.experts.99.up_proj.weight": "model-00059-of-00142.safetensors", + "model.layers.39.mlp.gate.e_score_correction_bias": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.gate.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.shared_experts.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.shared_experts.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.mlp.shared_experts.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.39.post_attention_layernorm.weight": "model-00060-of-00142.safetensors", + "model.layers.39.self_attn.k_norm.weight": "model-00058-of-00142.safetensors", + "model.layers.39.self_attn.k_proj.bias": "model-00058-of-00142.safetensors", + "model.layers.39.self_attn.k_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.self_attn.o_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.self_attn.q_norm.weight": "model-00058-of-00142.safetensors", + "model.layers.39.self_attn.q_proj.bias": "model-00058-of-00142.safetensors", + "model.layers.39.self_attn.q_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.39.self_attn.v_proj.bias": "model-00058-of-00142.safetensors", + "model.layers.39.self_attn.v_proj.weight": "model-00058-of-00142.safetensors", + "model.layers.4.input_layernorm.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.0.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.0.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.0.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.1.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.1.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.1.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.10.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.10.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.10.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.100.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.100.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.100.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.101.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.101.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.101.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.102.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.102.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.102.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.103.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.103.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.103.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.104.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.104.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.104.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.105.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.105.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.105.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.106.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.106.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.106.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.107.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.107.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.107.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.108.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.108.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.108.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.109.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.109.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.109.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.11.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.11.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.11.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.110.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.110.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.110.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.111.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.111.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.111.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.112.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.112.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.112.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.113.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.113.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.113.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.114.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.114.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.114.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.115.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.115.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.115.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.116.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.116.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.116.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.117.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.117.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.117.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.118.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.118.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.118.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.119.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.119.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.119.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.12.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.12.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.12.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.120.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.120.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.120.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.121.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.121.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.121.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.122.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.122.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.122.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.123.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.123.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.123.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.124.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.124.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.124.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.125.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.125.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.125.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.126.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.126.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.126.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.127.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.127.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.127.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.128.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.128.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.128.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.129.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.129.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.129.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.13.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.13.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.13.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.130.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.130.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.130.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.131.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.131.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.131.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.132.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.132.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.132.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.133.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.133.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.133.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.134.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.134.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.134.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.135.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.135.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.135.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.136.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.136.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.136.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.137.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.137.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.137.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.138.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.138.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.138.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.139.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.139.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.139.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.14.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.14.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.14.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.140.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.140.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.140.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.141.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.141.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.141.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.142.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.142.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.142.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.143.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.143.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.143.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.144.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.144.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.144.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.145.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.145.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.145.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.146.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.146.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.146.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.147.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.147.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.147.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.148.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.148.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.148.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.149.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.149.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.149.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.15.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.15.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.15.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.150.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.150.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.150.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.151.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.151.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.151.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.152.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.152.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.152.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.153.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.153.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.153.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.154.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.154.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.154.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.155.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.155.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.155.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.156.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.156.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.156.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.157.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.157.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.157.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.158.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.158.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.158.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.159.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.159.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.159.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.16.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.16.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.16.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.17.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.17.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.17.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.18.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.18.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.18.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.19.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.19.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.19.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.2.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.2.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.2.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.20.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.20.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.20.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.21.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.21.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.21.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.22.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.22.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.22.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.23.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.23.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.23.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.24.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.24.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.24.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.25.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.25.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.25.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.26.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.26.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.26.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.27.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.27.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.27.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.28.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.28.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.28.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.29.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.29.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.29.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.3.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.3.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.3.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.30.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.30.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.30.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.31.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.31.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.31.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.32.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.32.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.32.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.33.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.33.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.33.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.34.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.34.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.34.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.35.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.35.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.35.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.36.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.36.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.36.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.37.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.37.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.37.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.38.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.38.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.38.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.39.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.39.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.39.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.4.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.4.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.4.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.40.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.40.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.40.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.41.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.41.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.41.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.42.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.42.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.42.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.43.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.43.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.43.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.44.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.44.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.44.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.45.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.45.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.45.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.46.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.46.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.46.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.47.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.47.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.47.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.48.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.48.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.48.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.49.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.49.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.49.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.5.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.5.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.5.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.50.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.50.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.50.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.51.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.51.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.51.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.52.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.52.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.52.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.53.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.53.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.53.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.54.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.54.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.54.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.55.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.55.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.55.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.56.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.56.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.56.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.57.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.57.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.57.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.58.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.58.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.58.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.59.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.59.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.59.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.6.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.6.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.6.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.60.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.60.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.60.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.61.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.61.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.61.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.62.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.62.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.62.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.63.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.63.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.63.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.64.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.64.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.64.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.65.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.65.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.65.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.66.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.66.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.66.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.67.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.67.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.67.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.68.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.68.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.68.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.69.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.69.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.69.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.7.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.7.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.7.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.70.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.70.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.70.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.71.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.71.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.71.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.72.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.72.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.72.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.73.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.73.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.73.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.74.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.74.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.74.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.75.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.75.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.75.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.76.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.76.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.76.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.77.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.77.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.77.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.78.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.78.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.78.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.79.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.79.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.79.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.8.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.8.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.8.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.80.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.80.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.80.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.81.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.81.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.81.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.82.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.82.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.82.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.83.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.83.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.83.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.84.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.84.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.84.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.85.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.85.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.85.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.86.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.86.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.86.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.87.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.87.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.87.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.88.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.88.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.88.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.89.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.89.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.89.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.9.down_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.9.gate_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.9.up_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.mlp.experts.90.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.90.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.90.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.91.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.91.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.91.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.92.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.92.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.92.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.93.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.93.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.93.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.94.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.94.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.94.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.95.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.95.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.95.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.96.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.96.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.96.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.97.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.97.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.97.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.98.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.98.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.98.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.99.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.99.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.experts.99.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.gate.e_score_correction_bias": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.gate.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.shared_experts.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.shared_experts.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.mlp.shared_experts.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00004-of-00142.safetensors", + "model.layers.4.self_attn.k_norm.weight": "model-00003-of-00142.safetensors", + "model.layers.4.self_attn.k_proj.bias": "model-00003-of-00142.safetensors", + "model.layers.4.self_attn.k_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.self_attn.q_norm.weight": "model-00003-of-00142.safetensors", + "model.layers.4.self_attn.q_proj.bias": "model-00003-of-00142.safetensors", + "model.layers.4.self_attn.q_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.4.self_attn.v_proj.bias": "model-00003-of-00142.safetensors", + "model.layers.4.self_attn.v_proj.weight": "model-00003-of-00142.safetensors", + "model.layers.40.input_layernorm.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.0.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.0.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.0.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.1.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.1.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.1.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.10.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.10.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.10.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.100.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.100.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.100.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.101.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.101.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.101.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.102.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.102.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.102.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.103.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.103.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.103.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.104.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.104.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.104.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.105.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.105.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.105.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.106.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.106.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.106.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.107.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.107.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.107.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.108.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.108.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.108.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.109.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.109.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.109.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.11.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.11.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.11.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.110.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.110.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.110.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.111.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.111.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.111.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.112.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.112.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.112.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.113.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.113.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.113.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.114.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.114.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.114.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.115.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.115.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.115.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.116.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.116.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.116.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.117.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.117.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.117.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.118.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.118.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.118.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.119.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.119.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.119.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.12.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.12.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.12.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.120.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.120.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.120.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.121.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.121.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.121.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.122.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.122.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.122.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.123.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.123.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.123.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.124.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.124.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.124.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.125.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.125.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.125.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.126.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.126.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.126.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.127.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.127.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.127.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.128.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.128.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.128.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.129.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.129.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.129.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.13.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.13.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.13.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.130.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.130.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.130.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.131.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.131.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.131.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.132.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.132.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.132.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.133.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.133.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.133.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.134.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.134.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.134.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.135.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.135.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.135.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.136.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.136.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.136.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.137.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.137.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.137.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.138.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.138.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.138.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.139.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.139.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.139.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.14.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.14.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.14.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.140.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.140.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.140.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.141.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.141.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.141.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.142.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.142.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.142.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.143.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.143.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.143.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.144.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.144.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.144.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.145.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.145.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.145.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.146.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.146.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.146.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.147.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.147.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.147.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.148.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.148.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.148.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.149.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.149.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.149.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.15.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.15.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.15.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.150.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.150.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.150.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.151.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.151.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.151.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.152.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.152.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.152.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.153.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.153.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.153.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.154.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.154.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.154.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.155.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.155.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.155.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.156.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.156.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.156.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.157.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.157.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.157.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.158.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.158.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.158.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.159.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.159.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.159.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.16.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.16.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.16.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.17.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.17.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.17.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.18.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.18.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.18.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.19.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.19.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.19.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.2.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.2.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.2.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.20.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.20.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.20.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.21.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.21.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.21.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.22.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.22.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.22.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.23.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.23.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.23.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.24.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.24.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.24.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.25.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.25.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.25.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.26.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.26.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.26.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.27.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.27.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.27.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.28.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.28.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.28.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.29.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.29.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.29.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.3.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.3.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.3.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.30.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.30.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.30.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.31.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.31.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.31.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.32.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.32.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.32.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.33.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.33.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.33.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.34.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.34.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.34.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.35.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.35.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.35.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.36.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.36.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.36.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.37.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.37.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.37.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.38.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.38.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.38.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.39.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.39.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.39.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.4.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.4.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.4.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.40.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.40.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.40.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.41.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.41.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.41.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.42.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.42.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.42.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.43.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.43.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.43.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.44.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.44.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.44.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.45.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.45.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.45.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.46.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.46.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.46.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.47.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.47.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.47.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.48.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.48.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.48.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.49.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.49.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.49.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.5.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.5.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.5.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.50.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.50.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.50.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.51.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.51.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.51.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.52.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.52.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.52.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.53.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.53.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.53.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.54.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.54.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.54.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.55.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.55.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.55.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.56.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.56.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.56.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.57.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.57.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.57.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.58.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.58.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.58.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.59.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.59.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.59.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.6.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.6.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.6.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.60.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.60.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.60.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.61.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.61.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.61.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.62.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.62.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.62.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.63.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.63.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.63.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.64.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.64.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.64.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.65.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.65.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.65.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.66.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.66.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.66.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.67.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.67.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.67.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.68.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.68.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.68.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.69.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.69.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.69.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.7.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.7.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.7.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.70.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.70.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.70.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.71.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.71.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.71.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.72.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.72.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.72.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.73.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.73.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.73.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.74.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.74.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.74.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.75.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.75.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.75.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.76.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.76.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.76.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.77.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.77.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.77.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.78.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.78.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.78.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.79.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.79.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.79.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.8.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.8.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.8.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.80.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.80.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.80.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.81.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.81.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.81.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.82.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.82.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.82.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.83.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.83.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.83.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.84.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.84.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.84.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.85.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.85.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.85.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.86.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.86.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.86.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.87.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.87.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.87.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.88.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.88.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.88.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.89.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.89.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.89.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.9.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.9.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.9.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.90.down_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.90.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.90.up_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.91.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.91.gate_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.mlp.experts.91.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.92.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.92.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.92.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.93.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.93.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.93.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.94.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.94.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.94.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.95.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.95.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.95.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.96.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.96.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.96.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.97.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.97.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.97.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.98.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.98.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.98.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.99.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.99.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.experts.99.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.gate.e_score_correction_bias": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.gate.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.shared_experts.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.shared_experts.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.mlp.shared_experts.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.40.post_attention_layernorm.weight": "model-00061-of-00142.safetensors", + "model.layers.40.self_attn.k_norm.weight": "model-00060-of-00142.safetensors", + "model.layers.40.self_attn.k_proj.bias": "model-00060-of-00142.safetensors", + "model.layers.40.self_attn.k_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.self_attn.o_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.self_attn.q_norm.weight": "model-00060-of-00142.safetensors", + "model.layers.40.self_attn.q_proj.bias": "model-00060-of-00142.safetensors", + "model.layers.40.self_attn.q_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.40.self_attn.v_proj.bias": "model-00060-of-00142.safetensors", + "model.layers.40.self_attn.v_proj.weight": "model-00060-of-00142.safetensors", + "model.layers.41.input_layernorm.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.0.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.0.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.0.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.1.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.1.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.1.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.10.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.10.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.10.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.100.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.100.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.100.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.101.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.101.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.101.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.102.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.102.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.102.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.103.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.103.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.103.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.104.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.104.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.104.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.105.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.105.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.105.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.106.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.106.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.106.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.107.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.107.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.107.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.108.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.108.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.108.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.109.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.109.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.109.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.11.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.11.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.11.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.110.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.110.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.110.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.111.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.111.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.111.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.112.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.112.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.112.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.113.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.113.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.113.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.114.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.114.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.114.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.115.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.115.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.115.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.116.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.116.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.116.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.117.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.117.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.117.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.118.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.118.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.118.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.119.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.119.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.119.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.12.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.12.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.12.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.120.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.120.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.120.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.121.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.121.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.121.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.122.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.122.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.122.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.123.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.123.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.123.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.124.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.124.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.124.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.125.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.125.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.125.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.126.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.126.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.126.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.127.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.127.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.127.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.128.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.128.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.128.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.129.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.129.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.129.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.13.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.13.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.13.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.130.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.130.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.130.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.131.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.131.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.131.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.132.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.132.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.132.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.133.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.133.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.133.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.134.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.134.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.134.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.135.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.135.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.135.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.136.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.136.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.136.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.137.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.137.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.137.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.138.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.138.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.138.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.139.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.139.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.139.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.14.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.14.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.14.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.140.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.140.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.140.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.141.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.141.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.141.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.142.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.142.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.142.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.143.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.143.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.143.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.144.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.144.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.144.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.145.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.145.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.145.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.146.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.146.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.146.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.147.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.147.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.147.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.148.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.148.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.148.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.149.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.149.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.149.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.15.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.15.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.15.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.150.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.150.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.150.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.151.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.151.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.151.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.152.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.152.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.152.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.153.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.153.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.153.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.154.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.154.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.154.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.155.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.155.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.155.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.156.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.156.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.156.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.157.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.157.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.157.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.158.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.158.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.158.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.159.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.159.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.159.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.experts.16.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.16.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.16.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.17.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.17.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.17.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.18.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.18.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.18.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.19.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.19.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.19.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.2.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.2.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.2.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.20.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.20.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.20.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.21.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.21.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.21.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.22.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.22.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.22.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.23.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.23.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.23.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.24.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.24.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.24.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.25.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.25.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.25.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.26.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.26.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.26.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.27.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.27.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.27.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.28.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.28.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.28.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.29.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.29.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.29.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.3.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.3.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.3.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.30.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.30.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.30.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.31.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.31.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.31.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.32.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.32.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.32.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.33.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.33.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.33.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.34.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.34.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.34.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.35.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.35.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.35.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.36.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.36.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.36.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.37.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.37.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.37.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.38.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.38.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.38.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.39.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.39.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.39.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.4.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.4.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.4.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.40.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.40.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.40.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.41.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.41.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.41.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.42.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.42.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.42.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.43.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.43.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.43.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.44.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.44.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.44.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.45.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.45.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.45.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.46.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.46.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.46.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.47.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.47.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.47.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.48.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.48.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.48.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.49.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.49.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.49.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.5.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.5.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.5.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.50.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.50.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.50.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.51.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.51.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.51.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.52.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.52.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.52.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.53.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.53.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.53.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.54.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.54.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.54.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.55.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.55.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.55.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.56.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.56.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.56.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.57.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.57.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.57.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.58.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.58.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.58.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.59.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.59.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.59.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.6.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.6.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.6.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.60.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.60.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.60.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.61.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.61.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.61.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.62.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.62.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.62.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.63.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.63.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.63.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.64.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.64.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.64.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.65.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.65.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.65.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.66.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.66.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.66.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.67.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.67.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.67.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.68.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.68.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.68.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.69.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.69.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.69.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.7.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.7.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.7.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.70.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.70.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.70.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.71.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.71.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.71.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.72.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.72.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.72.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.73.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.73.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.73.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.74.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.74.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.74.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.75.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.75.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.75.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.76.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.76.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.76.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.77.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.77.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.77.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.78.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.78.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.78.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.79.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.79.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.79.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.8.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.8.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.8.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.80.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.80.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.80.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.81.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.81.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.81.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.82.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.82.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.82.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.83.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.83.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.83.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.84.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.84.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.84.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.85.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.85.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.85.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.86.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.86.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.86.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.87.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.87.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.87.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.88.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.88.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.88.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.89.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.89.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.89.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.9.down_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.9.gate_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.9.up_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.mlp.experts.90.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.90.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.90.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.91.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.91.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.91.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.92.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.92.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.92.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.93.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.93.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.93.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.94.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.94.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.94.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.95.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.95.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.95.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.96.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.96.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.96.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.97.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.97.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.97.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.98.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.98.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.98.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.99.down_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.99.gate_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.experts.99.up_proj.weight": "model-00062-of-00142.safetensors", + "model.layers.41.mlp.gate.e_score_correction_bias": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.gate.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.shared_experts.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.shared_experts.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.mlp.shared_experts.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.41.post_attention_layernorm.weight": "model-00063-of-00142.safetensors", + "model.layers.41.self_attn.k_norm.weight": "model-00061-of-00142.safetensors", + "model.layers.41.self_attn.k_proj.bias": "model-00061-of-00142.safetensors", + "model.layers.41.self_attn.k_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.self_attn.o_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.self_attn.q_norm.weight": "model-00061-of-00142.safetensors", + "model.layers.41.self_attn.q_proj.bias": "model-00061-of-00142.safetensors", + "model.layers.41.self_attn.q_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.41.self_attn.v_proj.bias": "model-00061-of-00142.safetensors", + "model.layers.41.self_attn.v_proj.weight": "model-00061-of-00142.safetensors", + "model.layers.42.input_layernorm.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.0.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.0.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.0.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.1.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.1.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.1.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.10.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.10.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.10.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.100.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.100.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.100.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.101.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.101.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.101.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.102.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.102.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.102.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.103.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.103.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.103.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.104.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.104.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.104.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.105.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.105.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.105.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.106.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.106.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.106.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.107.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.107.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.107.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.108.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.108.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.108.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.109.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.109.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.109.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.11.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.11.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.11.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.110.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.110.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.110.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.111.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.111.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.111.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.112.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.112.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.112.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.113.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.113.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.113.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.114.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.114.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.114.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.115.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.115.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.115.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.116.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.116.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.116.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.117.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.117.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.117.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.118.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.118.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.118.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.119.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.119.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.119.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.12.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.12.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.12.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.120.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.120.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.120.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.121.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.121.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.121.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.122.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.122.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.122.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.123.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.123.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.123.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.124.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.124.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.124.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.125.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.125.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.125.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.126.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.126.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.126.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.127.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.127.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.127.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.128.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.128.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.128.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.129.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.129.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.129.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.13.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.13.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.13.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.130.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.130.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.130.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.131.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.131.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.131.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.132.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.132.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.132.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.133.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.133.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.133.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.134.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.134.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.134.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.135.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.135.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.135.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.136.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.136.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.136.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.137.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.137.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.137.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.138.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.138.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.138.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.139.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.139.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.139.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.14.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.14.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.14.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.140.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.140.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.140.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.141.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.141.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.141.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.142.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.142.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.142.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.143.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.143.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.143.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.144.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.144.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.144.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.145.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.145.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.145.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.146.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.146.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.146.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.147.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.147.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.147.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.148.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.148.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.148.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.149.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.149.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.149.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.15.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.15.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.15.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.150.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.150.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.150.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.151.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.151.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.151.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.152.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.152.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.152.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.153.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.153.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.153.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.154.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.154.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.154.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.155.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.155.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.155.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.156.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.156.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.156.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.157.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.157.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.157.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.158.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.158.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.158.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.159.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.159.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.159.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.16.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.16.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.16.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.17.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.17.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.17.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.18.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.18.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.18.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.19.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.19.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.19.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.2.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.2.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.2.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.20.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.20.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.20.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.21.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.21.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.21.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.22.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.22.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.22.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.23.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.23.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.23.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.24.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.24.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.24.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.25.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.25.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.25.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.26.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.26.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.26.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.27.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.27.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.27.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.28.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.28.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.28.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.29.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.29.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.29.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.3.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.3.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.3.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.30.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.30.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.30.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.31.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.31.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.31.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.32.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.32.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.32.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.33.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.33.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.33.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.34.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.34.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.34.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.35.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.35.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.35.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.36.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.36.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.36.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.37.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.37.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.37.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.38.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.38.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.38.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.39.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.39.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.39.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.4.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.4.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.4.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.40.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.40.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.40.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.41.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.41.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.41.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.42.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.42.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.42.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.43.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.43.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.43.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.44.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.44.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.44.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.45.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.45.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.45.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.46.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.46.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.46.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.47.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.47.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.47.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.48.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.48.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.48.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.49.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.49.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.49.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.5.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.5.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.5.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.50.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.50.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.50.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.51.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.51.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.51.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.52.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.52.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.52.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.53.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.53.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.53.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.54.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.54.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.54.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.55.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.55.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.55.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.56.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.56.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.56.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.57.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.57.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.57.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.58.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.58.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.58.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.59.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.59.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.59.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.6.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.6.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.6.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.60.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.60.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.60.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.61.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.61.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.61.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.62.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.62.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.62.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.63.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.63.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.63.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.64.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.64.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.64.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.65.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.65.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.65.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.66.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.66.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.66.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.67.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.67.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.67.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.68.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.68.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.68.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.69.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.69.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.69.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.7.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.7.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.7.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.70.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.70.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.70.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.71.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.71.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.71.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.72.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.72.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.72.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.73.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.73.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.73.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.74.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.74.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.74.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.75.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.75.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.75.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.76.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.76.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.76.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.77.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.77.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.77.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.78.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.78.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.78.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.79.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.79.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.79.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.8.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.8.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.8.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.80.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.80.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.80.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.81.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.81.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.81.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.82.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.82.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.82.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.83.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.83.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.83.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.84.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.84.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.84.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.85.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.85.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.85.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.86.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.86.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.86.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.87.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.87.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.87.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.88.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.88.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.88.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.89.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.89.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.89.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.9.down_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.9.gate_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.9.up_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.mlp.experts.90.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.90.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.90.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.91.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.91.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.91.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.92.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.92.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.92.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.93.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.93.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.93.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.94.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.94.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.94.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.95.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.95.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.95.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.96.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.96.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.96.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.97.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.97.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.97.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.98.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.98.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.98.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.99.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.99.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.experts.99.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.gate.e_score_correction_bias": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.gate.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.shared_experts.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.shared_experts.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.mlp.shared_experts.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.42.post_attention_layernorm.weight": "model-00064-of-00142.safetensors", + "model.layers.42.self_attn.k_norm.weight": "model-00063-of-00142.safetensors", + "model.layers.42.self_attn.k_proj.bias": "model-00063-of-00142.safetensors", + "model.layers.42.self_attn.k_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.self_attn.o_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.self_attn.q_norm.weight": "model-00063-of-00142.safetensors", + "model.layers.42.self_attn.q_proj.bias": "model-00063-of-00142.safetensors", + "model.layers.42.self_attn.q_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.42.self_attn.v_proj.bias": "model-00063-of-00142.safetensors", + "model.layers.42.self_attn.v_proj.weight": "model-00063-of-00142.safetensors", + "model.layers.43.input_layernorm.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.0.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.0.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.0.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.1.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.1.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.1.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.10.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.10.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.10.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.100.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.100.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.100.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.101.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.101.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.101.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.102.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.102.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.102.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.103.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.103.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.103.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.104.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.104.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.104.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.105.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.105.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.105.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.106.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.106.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.106.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.107.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.107.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.107.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.108.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.108.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.108.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.109.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.109.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.109.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.11.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.11.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.11.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.110.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.110.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.110.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.111.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.111.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.111.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.112.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.112.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.112.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.113.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.113.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.113.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.114.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.114.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.114.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.115.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.115.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.115.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.116.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.116.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.116.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.117.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.117.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.117.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.118.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.118.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.118.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.119.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.119.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.119.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.12.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.12.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.12.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.120.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.120.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.120.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.121.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.121.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.121.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.122.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.122.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.122.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.123.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.123.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.123.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.124.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.124.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.124.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.125.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.125.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.125.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.126.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.126.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.126.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.127.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.127.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.127.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.128.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.128.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.128.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.129.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.129.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.129.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.13.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.13.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.13.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.130.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.130.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.130.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.131.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.131.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.131.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.132.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.132.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.132.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.133.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.133.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.133.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.134.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.134.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.134.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.135.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.135.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.135.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.136.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.136.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.136.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.137.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.137.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.137.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.138.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.138.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.138.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.139.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.139.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.139.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.14.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.14.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.14.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.140.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.140.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.140.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.141.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.141.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.141.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.142.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.142.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.142.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.143.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.143.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.143.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.144.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.144.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.144.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.145.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.145.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.145.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.146.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.146.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.146.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.147.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.147.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.147.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.148.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.148.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.148.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.149.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.149.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.149.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.15.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.15.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.15.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.150.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.150.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.150.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.151.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.151.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.151.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.152.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.152.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.152.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.153.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.153.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.153.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.154.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.154.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.154.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.155.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.155.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.155.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.156.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.156.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.156.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.157.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.157.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.157.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.158.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.158.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.158.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.159.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.159.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.159.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.experts.16.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.16.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.16.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.17.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.17.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.17.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.18.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.18.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.18.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.19.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.19.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.19.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.2.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.2.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.2.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.20.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.20.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.20.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.21.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.21.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.21.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.22.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.22.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.22.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.23.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.23.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.23.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.24.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.24.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.24.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.25.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.25.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.25.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.26.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.26.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.26.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.27.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.27.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.27.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.28.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.28.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.28.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.29.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.29.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.29.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.3.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.3.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.3.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.30.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.30.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.30.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.31.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.31.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.31.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.32.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.32.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.32.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.33.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.33.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.33.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.34.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.34.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.34.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.35.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.35.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.35.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.36.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.36.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.36.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.37.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.37.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.37.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.38.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.38.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.38.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.39.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.39.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.39.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.4.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.4.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.4.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.40.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.40.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.40.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.41.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.41.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.41.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.42.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.42.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.42.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.43.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.43.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.43.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.44.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.44.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.44.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.45.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.45.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.45.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.46.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.46.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.46.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.47.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.47.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.47.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.48.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.48.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.48.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.49.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.49.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.49.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.5.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.5.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.5.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.50.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.50.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.50.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.51.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.51.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.51.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.52.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.52.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.52.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.53.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.53.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.53.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.54.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.54.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.54.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.55.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.55.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.55.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.56.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.56.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.56.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.57.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.57.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.57.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.58.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.58.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.58.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.59.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.59.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.59.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.6.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.6.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.6.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.60.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.60.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.60.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.61.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.61.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.61.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.62.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.62.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.62.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.63.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.63.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.63.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.64.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.64.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.64.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.65.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.65.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.65.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.66.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.66.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.66.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.67.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.67.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.67.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.68.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.68.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.68.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.69.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.69.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.69.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.7.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.7.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.7.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.70.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.70.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.70.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.71.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.71.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.71.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.72.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.72.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.72.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.73.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.73.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.73.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.74.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.74.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.74.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.75.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.75.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.75.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.76.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.76.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.76.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.77.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.77.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.77.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.78.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.78.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.78.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.79.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.79.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.79.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.8.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.8.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.8.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.80.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.80.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.80.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.81.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.81.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.81.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.82.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.82.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.82.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.83.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.83.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.83.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.84.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.84.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.84.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.85.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.85.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.85.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.86.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.86.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.86.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.87.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.87.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.87.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.88.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.88.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.88.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.89.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.89.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.89.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.9.down_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.9.gate_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.9.up_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.mlp.experts.90.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.90.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.90.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.91.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.91.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.91.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.92.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.92.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.92.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.93.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.93.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.93.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.94.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.94.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.94.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.95.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.95.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.95.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.96.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.96.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.96.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.97.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.97.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.97.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.98.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.98.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.98.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.99.down_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.99.gate_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.experts.99.up_proj.weight": "model-00065-of-00142.safetensors", + "model.layers.43.mlp.gate.e_score_correction_bias": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.gate.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.shared_experts.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.shared_experts.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.mlp.shared_experts.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.43.post_attention_layernorm.weight": "model-00066-of-00142.safetensors", + "model.layers.43.self_attn.k_norm.weight": "model-00064-of-00142.safetensors", + "model.layers.43.self_attn.k_proj.bias": "model-00064-of-00142.safetensors", + "model.layers.43.self_attn.k_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.self_attn.o_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.self_attn.q_norm.weight": "model-00064-of-00142.safetensors", + "model.layers.43.self_attn.q_proj.bias": "model-00064-of-00142.safetensors", + "model.layers.43.self_attn.q_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.43.self_attn.v_proj.bias": "model-00064-of-00142.safetensors", + "model.layers.43.self_attn.v_proj.weight": "model-00064-of-00142.safetensors", + "model.layers.44.input_layernorm.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.0.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.0.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.0.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.1.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.1.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.1.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.10.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.10.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.10.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.100.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.100.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.100.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.101.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.101.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.101.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.102.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.102.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.102.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.103.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.103.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.103.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.104.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.104.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.104.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.105.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.105.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.105.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.106.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.106.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.106.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.107.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.107.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.107.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.108.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.108.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.108.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.109.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.109.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.109.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.11.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.11.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.11.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.110.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.110.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.110.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.111.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.111.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.111.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.112.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.112.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.112.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.113.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.113.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.113.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.114.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.114.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.114.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.115.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.115.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.115.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.116.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.116.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.116.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.117.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.117.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.117.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.118.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.118.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.118.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.119.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.119.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.119.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.12.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.12.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.12.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.120.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.120.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.120.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.121.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.121.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.121.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.122.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.122.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.122.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.123.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.123.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.123.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.124.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.124.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.124.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.125.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.125.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.125.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.126.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.126.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.126.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.127.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.127.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.127.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.128.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.128.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.128.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.129.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.129.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.129.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.13.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.13.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.13.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.130.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.130.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.130.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.131.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.131.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.131.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.132.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.132.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.132.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.133.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.133.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.133.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.134.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.134.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.134.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.135.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.135.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.135.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.136.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.136.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.136.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.137.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.137.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.137.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.138.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.138.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.138.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.139.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.139.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.139.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.14.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.14.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.14.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.140.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.140.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.140.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.141.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.141.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.141.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.142.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.142.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.142.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.143.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.143.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.143.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.144.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.144.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.144.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.145.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.145.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.145.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.146.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.146.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.146.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.147.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.147.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.147.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.148.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.148.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.148.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.149.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.149.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.149.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.15.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.15.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.15.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.150.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.150.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.150.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.151.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.151.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.151.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.152.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.152.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.152.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.153.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.153.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.153.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.154.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.154.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.154.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.155.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.155.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.155.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.156.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.156.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.156.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.157.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.157.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.157.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.158.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.158.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.158.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.159.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.159.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.159.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.16.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.16.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.16.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.17.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.17.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.17.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.18.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.18.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.18.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.19.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.19.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.19.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.2.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.2.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.2.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.20.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.20.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.20.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.21.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.21.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.21.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.22.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.22.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.22.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.23.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.23.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.23.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.24.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.24.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.24.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.25.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.25.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.25.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.26.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.26.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.26.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.27.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.27.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.27.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.28.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.28.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.28.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.29.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.29.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.29.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.3.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.3.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.3.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.30.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.30.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.30.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.31.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.31.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.31.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.32.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.32.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.32.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.33.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.33.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.33.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.34.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.34.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.34.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.35.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.35.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.35.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.36.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.36.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.36.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.37.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.37.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.37.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.38.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.38.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.38.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.39.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.39.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.39.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.4.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.4.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.4.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.40.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.40.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.40.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.41.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.41.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.41.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.42.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.42.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.42.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.43.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.43.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.43.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.44.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.44.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.44.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.45.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.45.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.45.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.46.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.46.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.46.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.47.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.47.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.47.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.48.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.48.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.48.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.49.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.49.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.49.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.5.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.5.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.5.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.50.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.50.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.50.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.51.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.51.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.51.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.52.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.52.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.52.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.53.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.53.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.53.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.54.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.54.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.54.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.55.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.55.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.55.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.56.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.56.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.56.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.57.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.57.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.57.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.58.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.58.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.58.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.59.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.59.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.59.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.6.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.6.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.6.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.60.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.60.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.60.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.61.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.61.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.61.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.62.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.62.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.62.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.63.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.63.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.63.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.64.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.64.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.64.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.65.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.65.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.65.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.66.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.66.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.66.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.67.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.67.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.67.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.68.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.68.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.68.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.69.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.69.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.69.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.7.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.7.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.7.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.70.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.70.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.70.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.71.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.71.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.71.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.72.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.72.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.72.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.73.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.73.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.73.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.74.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.74.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.74.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.75.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.75.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.75.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.76.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.76.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.76.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.77.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.77.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.77.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.78.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.78.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.78.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.79.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.79.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.79.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.8.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.8.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.8.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.80.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.80.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.80.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.81.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.81.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.81.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.82.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.82.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.82.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.83.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.83.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.83.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.84.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.84.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.84.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.85.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.85.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.85.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.86.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.86.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.86.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.87.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.87.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.87.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.88.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.88.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.88.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.89.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.89.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.89.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.9.down_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.9.gate_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.9.up_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.mlp.experts.90.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.90.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.90.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.91.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.91.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.91.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.92.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.92.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.92.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.93.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.93.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.93.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.94.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.94.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.94.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.95.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.95.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.95.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.96.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.96.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.96.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.97.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.97.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.97.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.98.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.98.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.98.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.99.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.99.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.experts.99.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.gate.e_score_correction_bias": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.gate.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.shared_experts.down_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.shared_experts.gate_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.mlp.shared_experts.up_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.44.post_attention_layernorm.weight": "model-00067-of-00142.safetensors", + "model.layers.44.self_attn.k_norm.weight": "model-00066-of-00142.safetensors", + "model.layers.44.self_attn.k_proj.bias": "model-00066-of-00142.safetensors", + "model.layers.44.self_attn.k_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.self_attn.o_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.self_attn.q_norm.weight": "model-00066-of-00142.safetensors", + "model.layers.44.self_attn.q_proj.bias": "model-00066-of-00142.safetensors", + "model.layers.44.self_attn.q_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.44.self_attn.v_proj.bias": "model-00066-of-00142.safetensors", + "model.layers.44.self_attn.v_proj.weight": "model-00066-of-00142.safetensors", + "model.layers.45.input_layernorm.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.0.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.0.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.0.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.1.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.1.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.1.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.10.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.10.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.10.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.100.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.100.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.100.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.101.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.101.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.101.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.102.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.102.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.102.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.103.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.103.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.103.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.104.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.104.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.104.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.105.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.105.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.105.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.106.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.106.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.106.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.107.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.107.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.107.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.108.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.108.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.108.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.109.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.109.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.109.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.11.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.11.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.11.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.110.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.110.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.110.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.111.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.111.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.111.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.112.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.112.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.112.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.113.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.113.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.113.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.114.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.114.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.114.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.115.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.115.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.115.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.116.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.116.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.116.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.117.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.117.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.117.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.118.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.118.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.118.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.119.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.119.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.119.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.12.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.12.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.12.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.120.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.120.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.120.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.121.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.121.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.121.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.122.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.122.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.122.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.123.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.123.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.123.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.124.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.124.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.124.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.125.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.125.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.125.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.126.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.126.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.126.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.127.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.127.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.127.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.128.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.128.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.128.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.129.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.129.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.129.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.13.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.13.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.13.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.130.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.130.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.130.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.131.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.131.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.131.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.132.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.132.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.132.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.133.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.133.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.133.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.134.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.134.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.134.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.135.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.135.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.135.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.136.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.136.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.136.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.137.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.137.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.137.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.138.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.138.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.138.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.139.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.139.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.139.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.14.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.14.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.14.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.140.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.140.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.140.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.141.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.141.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.141.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.142.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.142.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.142.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.143.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.143.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.143.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.144.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.144.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.144.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.145.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.145.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.145.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.146.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.146.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.146.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.147.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.147.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.147.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.148.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.148.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.148.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.149.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.149.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.149.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.15.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.15.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.15.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.150.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.150.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.150.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.151.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.151.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.151.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.152.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.152.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.152.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.153.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.153.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.153.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.154.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.154.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.154.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.155.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.155.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.155.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.156.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.156.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.156.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.157.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.157.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.157.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.158.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.158.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.158.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.159.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.159.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.159.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.experts.16.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.16.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.16.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.17.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.17.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.17.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.18.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.18.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.18.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.19.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.19.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.19.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.2.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.2.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.2.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.20.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.20.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.20.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.21.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.21.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.21.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.22.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.22.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.22.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.23.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.23.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.23.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.24.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.24.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.24.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.25.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.25.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.25.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.26.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.26.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.26.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.27.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.27.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.27.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.28.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.28.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.28.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.29.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.29.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.29.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.3.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.3.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.3.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.30.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.30.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.30.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.31.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.31.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.31.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.32.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.32.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.32.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.33.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.33.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.33.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.34.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.34.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.34.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.35.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.35.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.35.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.36.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.36.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.36.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.37.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.37.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.37.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.38.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.38.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.38.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.39.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.39.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.39.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.4.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.4.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.4.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.40.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.40.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.40.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.41.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.41.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.41.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.42.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.42.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.42.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.43.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.43.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.43.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.44.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.44.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.44.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.45.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.45.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.45.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.46.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.46.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.46.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.47.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.47.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.47.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.48.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.48.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.48.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.49.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.49.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.49.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.5.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.5.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.5.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.50.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.50.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.50.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.51.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.51.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.51.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.52.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.52.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.52.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.53.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.53.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.53.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.54.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.54.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.54.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.55.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.55.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.55.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.56.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.56.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.56.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.57.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.57.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.57.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.58.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.58.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.58.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.59.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.59.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.59.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.6.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.6.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.6.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.60.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.60.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.60.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.61.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.61.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.61.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.62.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.62.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.62.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.63.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.63.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.63.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.64.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.64.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.64.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.65.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.65.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.65.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.66.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.66.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.66.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.67.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.67.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.67.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.68.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.68.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.68.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.69.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.69.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.69.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.7.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.7.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.7.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.70.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.70.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.70.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.71.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.71.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.71.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.72.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.72.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.72.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.73.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.73.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.73.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.74.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.74.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.74.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.75.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.75.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.75.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.76.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.76.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.76.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.77.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.77.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.77.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.78.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.78.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.78.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.79.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.79.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.79.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.8.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.8.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.8.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.80.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.80.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.80.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.81.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.81.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.81.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.82.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.82.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.82.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.83.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.83.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.83.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.84.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.84.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.84.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.85.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.85.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.85.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.86.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.86.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.86.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.87.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.87.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.87.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.88.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.88.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.88.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.89.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.89.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.89.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.9.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.9.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.9.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.90.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.90.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.90.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.91.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.91.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.91.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.92.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.92.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.92.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.93.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.93.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.93.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.94.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.94.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.94.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.95.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.95.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.95.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.96.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.96.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.96.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.97.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.97.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.97.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.98.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.98.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.98.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.99.down_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.99.gate_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.experts.99.up_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.mlp.gate.e_score_correction_bias": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.gate.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.shared_experts.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.shared_experts.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.mlp.shared_experts.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.45.post_attention_layernorm.weight": "model-00069-of-00142.safetensors", + "model.layers.45.self_attn.k_norm.weight": "model-00068-of-00142.safetensors", + "model.layers.45.self_attn.k_proj.bias": "model-00067-of-00142.safetensors", + "model.layers.45.self_attn.k_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.45.self_attn.o_proj.weight": "model-00068-of-00142.safetensors", + "model.layers.45.self_attn.q_norm.weight": "model-00068-of-00142.safetensors", + "model.layers.45.self_attn.q_proj.bias": "model-00067-of-00142.safetensors", + "model.layers.45.self_attn.q_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.45.self_attn.v_proj.bias": "model-00067-of-00142.safetensors", + "model.layers.45.self_attn.v_proj.weight": "model-00067-of-00142.safetensors", + "model.layers.46.input_layernorm.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.0.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.0.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.0.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.1.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.1.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.1.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.10.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.10.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.10.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.100.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.100.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.100.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.101.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.101.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.101.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.102.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.102.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.102.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.103.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.103.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.103.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.104.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.104.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.104.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.105.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.105.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.105.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.106.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.106.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.106.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.107.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.107.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.107.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.108.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.108.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.108.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.109.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.109.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.109.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.11.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.11.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.11.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.110.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.110.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.110.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.111.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.111.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.111.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.112.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.112.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.112.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.113.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.113.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.113.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.114.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.114.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.114.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.115.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.115.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.115.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.116.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.116.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.116.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.117.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.117.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.117.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.118.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.118.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.118.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.119.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.119.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.119.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.12.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.12.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.12.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.120.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.120.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.120.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.121.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.121.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.121.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.122.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.122.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.122.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.123.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.123.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.123.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.124.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.124.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.124.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.125.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.125.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.125.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.126.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.126.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.126.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.127.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.127.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.127.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.128.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.128.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.128.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.129.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.129.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.129.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.13.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.13.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.13.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.130.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.130.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.130.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.131.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.131.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.131.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.132.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.132.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.132.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.133.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.133.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.133.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.134.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.134.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.134.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.135.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.135.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.135.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.136.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.136.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.136.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.137.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.137.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.137.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.138.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.138.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.138.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.139.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.139.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.139.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.14.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.14.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.14.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.140.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.140.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.140.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.141.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.141.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.141.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.142.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.142.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.142.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.143.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.143.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.143.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.144.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.144.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.144.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.145.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.145.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.145.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.146.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.146.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.146.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.147.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.147.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.147.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.148.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.148.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.148.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.149.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.149.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.149.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.15.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.15.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.15.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.150.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.150.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.150.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.151.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.151.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.151.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.152.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.152.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.152.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.153.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.153.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.153.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.154.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.154.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.154.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.155.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.155.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.155.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.156.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.156.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.156.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.157.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.157.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.157.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.158.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.158.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.158.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.159.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.159.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.159.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.experts.16.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.16.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.16.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.17.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.17.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.17.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.18.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.18.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.18.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.19.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.19.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.19.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.2.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.2.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.2.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.20.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.20.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.20.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.21.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.21.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.21.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.22.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.22.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.22.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.23.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.23.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.23.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.24.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.24.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.24.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.25.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.25.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.25.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.26.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.26.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.26.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.27.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.27.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.27.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.28.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.28.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.28.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.29.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.29.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.29.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.3.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.3.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.3.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.30.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.30.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.30.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.31.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.31.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.31.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.32.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.32.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.32.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.33.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.33.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.33.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.34.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.34.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.34.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.35.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.35.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.35.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.36.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.36.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.36.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.37.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.37.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.37.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.38.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.38.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.38.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.39.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.39.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.39.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.4.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.4.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.4.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.40.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.40.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.40.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.41.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.41.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.41.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.42.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.42.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.42.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.43.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.43.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.43.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.44.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.44.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.44.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.45.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.45.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.45.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.46.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.46.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.46.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.47.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.47.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.47.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.48.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.48.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.48.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.49.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.49.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.49.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.5.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.5.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.5.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.50.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.50.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.50.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.51.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.51.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.51.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.52.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.52.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.52.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.53.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.53.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.53.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.54.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.54.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.54.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.55.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.55.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.55.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.56.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.56.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.56.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.57.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.57.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.57.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.58.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.58.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.58.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.59.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.59.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.59.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.6.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.6.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.6.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.60.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.60.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.60.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.61.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.61.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.61.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.62.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.62.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.62.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.63.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.63.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.63.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.64.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.64.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.64.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.65.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.65.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.65.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.66.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.66.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.66.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.67.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.67.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.67.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.68.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.68.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.68.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.69.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.69.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.69.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.7.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.7.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.7.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.70.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.70.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.70.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.71.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.71.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.71.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.72.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.72.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.72.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.73.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.73.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.73.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.74.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.74.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.74.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.75.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.75.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.75.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.76.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.76.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.76.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.77.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.77.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.77.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.78.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.78.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.78.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.79.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.79.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.79.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.8.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.8.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.8.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.80.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.80.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.80.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.81.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.81.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.81.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.82.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.82.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.82.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.83.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.83.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.83.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.84.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.84.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.84.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.85.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.85.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.85.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.86.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.86.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.86.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.87.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.87.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.87.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.88.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.88.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.88.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.89.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.89.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.89.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.9.down_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.9.gate_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.9.up_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.mlp.experts.90.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.90.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.90.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.91.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.91.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.91.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.92.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.92.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.92.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.93.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.93.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.93.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.94.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.94.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.94.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.95.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.95.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.95.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.96.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.96.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.96.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.97.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.97.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.97.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.98.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.98.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.98.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.99.down_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.99.gate_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.experts.99.up_proj.weight": "model-00070-of-00142.safetensors", + "model.layers.46.mlp.gate.e_score_correction_bias": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.gate.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.shared_experts.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.shared_experts.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.mlp.shared_experts.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.46.post_attention_layernorm.weight": "model-00071-of-00142.safetensors", + "model.layers.46.self_attn.k_norm.weight": "model-00069-of-00142.safetensors", + "model.layers.46.self_attn.k_proj.bias": "model-00069-of-00142.safetensors", + "model.layers.46.self_attn.k_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.self_attn.o_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.self_attn.q_norm.weight": "model-00069-of-00142.safetensors", + "model.layers.46.self_attn.q_proj.bias": "model-00069-of-00142.safetensors", + "model.layers.46.self_attn.q_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.46.self_attn.v_proj.bias": "model-00069-of-00142.safetensors", + "model.layers.46.self_attn.v_proj.weight": "model-00069-of-00142.safetensors", + "model.layers.47.input_layernorm.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.0.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.0.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.0.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.1.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.1.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.1.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.10.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.10.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.10.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.100.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.100.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.100.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.101.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.101.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.101.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.102.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.102.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.102.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.103.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.103.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.103.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.104.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.104.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.104.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.105.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.105.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.105.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.106.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.106.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.106.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.107.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.107.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.107.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.108.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.108.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.108.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.109.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.109.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.109.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.11.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.11.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.11.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.110.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.110.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.110.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.111.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.111.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.111.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.112.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.112.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.112.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.113.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.113.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.113.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.114.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.114.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.114.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.115.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.115.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.115.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.116.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.116.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.116.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.117.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.117.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.117.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.118.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.118.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.118.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.119.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.119.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.119.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.12.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.12.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.12.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.120.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.120.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.120.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.121.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.121.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.121.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.122.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.122.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.122.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.123.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.123.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.123.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.124.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.124.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.124.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.125.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.125.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.125.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.126.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.126.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.126.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.127.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.127.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.127.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.128.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.128.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.128.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.129.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.129.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.129.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.13.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.13.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.13.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.130.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.130.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.130.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.131.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.131.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.131.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.132.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.132.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.132.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.133.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.133.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.133.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.134.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.134.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.134.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.135.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.135.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.135.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.136.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.136.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.136.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.137.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.137.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.137.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.138.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.138.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.138.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.139.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.139.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.139.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.14.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.14.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.14.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.140.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.140.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.140.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.141.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.141.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.141.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.142.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.142.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.142.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.143.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.143.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.143.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.144.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.144.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.144.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.145.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.145.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.145.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.146.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.146.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.146.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.147.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.147.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.147.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.148.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.148.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.148.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.149.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.149.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.149.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.15.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.15.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.15.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.150.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.150.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.150.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.151.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.151.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.151.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.152.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.152.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.152.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.153.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.153.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.153.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.154.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.154.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.154.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.155.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.155.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.155.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.156.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.156.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.156.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.157.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.157.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.157.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.158.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.158.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.158.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.159.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.159.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.159.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.16.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.16.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.16.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.17.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.17.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.17.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.18.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.18.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.18.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.19.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.19.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.19.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.2.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.2.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.2.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.20.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.20.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.20.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.21.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.21.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.21.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.22.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.22.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.22.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.23.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.23.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.23.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.24.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.24.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.24.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.25.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.25.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.25.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.26.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.26.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.26.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.27.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.27.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.27.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.28.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.28.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.28.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.29.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.29.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.29.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.3.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.3.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.3.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.30.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.30.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.30.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.31.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.31.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.31.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.32.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.32.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.32.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.33.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.33.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.33.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.34.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.34.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.34.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.35.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.35.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.35.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.36.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.36.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.36.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.37.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.37.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.37.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.38.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.38.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.38.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.39.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.39.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.39.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.4.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.4.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.4.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.40.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.40.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.40.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.41.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.41.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.41.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.42.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.42.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.42.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.43.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.43.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.43.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.44.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.44.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.44.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.45.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.45.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.45.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.46.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.46.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.46.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.47.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.47.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.47.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.48.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.48.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.48.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.49.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.49.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.49.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.5.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.5.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.5.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.50.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.50.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.50.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.51.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.51.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.51.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.52.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.52.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.52.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.53.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.53.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.53.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.54.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.54.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.54.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.55.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.55.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.55.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.56.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.56.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.56.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.57.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.57.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.57.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.58.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.58.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.58.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.59.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.59.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.59.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.6.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.6.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.6.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.60.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.60.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.60.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.61.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.61.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.61.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.62.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.62.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.62.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.63.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.63.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.63.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.64.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.64.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.64.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.65.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.65.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.65.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.66.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.66.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.66.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.67.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.67.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.67.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.68.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.68.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.68.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.69.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.69.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.69.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.7.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.7.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.7.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.70.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.70.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.70.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.71.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.71.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.71.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.72.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.72.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.72.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.73.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.73.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.73.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.74.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.74.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.74.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.75.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.75.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.75.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.76.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.76.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.76.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.77.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.77.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.77.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.78.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.78.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.78.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.79.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.79.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.79.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.8.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.8.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.8.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.80.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.80.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.80.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.81.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.81.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.81.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.82.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.82.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.82.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.83.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.83.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.83.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.84.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.84.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.84.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.85.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.85.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.85.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.86.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.86.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.86.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.87.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.87.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.87.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.88.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.88.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.88.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.89.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.89.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.89.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.9.down_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.9.gate_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.9.up_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.mlp.experts.90.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.90.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.90.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.91.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.91.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.91.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.92.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.92.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.92.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.93.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.93.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.93.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.94.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.94.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.94.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.95.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.95.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.95.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.96.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.96.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.96.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.97.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.97.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.97.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.98.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.98.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.98.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.99.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.99.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.experts.99.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.gate.e_score_correction_bias": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.gate.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.shared_experts.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.shared_experts.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.mlp.shared_experts.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.47.post_attention_layernorm.weight": "model-00072-of-00142.safetensors", + "model.layers.47.self_attn.k_norm.weight": "model-00071-of-00142.safetensors", + "model.layers.47.self_attn.k_proj.bias": "model-00071-of-00142.safetensors", + "model.layers.47.self_attn.k_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.self_attn.o_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.self_attn.q_norm.weight": "model-00071-of-00142.safetensors", + "model.layers.47.self_attn.q_proj.bias": "model-00071-of-00142.safetensors", + "model.layers.47.self_attn.q_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.47.self_attn.v_proj.bias": "model-00071-of-00142.safetensors", + "model.layers.47.self_attn.v_proj.weight": "model-00071-of-00142.safetensors", + "model.layers.48.input_layernorm.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.0.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.0.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.0.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.1.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.1.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.1.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.10.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.10.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.10.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.100.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.100.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.100.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.101.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.101.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.101.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.102.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.102.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.102.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.103.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.103.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.103.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.104.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.104.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.104.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.105.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.105.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.105.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.106.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.106.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.106.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.107.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.107.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.107.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.108.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.108.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.108.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.109.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.109.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.109.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.11.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.11.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.11.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.110.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.110.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.110.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.111.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.111.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.111.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.112.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.112.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.112.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.113.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.113.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.113.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.114.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.114.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.114.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.115.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.115.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.115.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.116.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.116.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.116.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.117.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.117.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.117.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.118.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.118.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.118.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.119.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.119.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.119.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.12.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.12.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.12.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.120.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.120.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.120.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.121.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.121.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.121.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.122.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.122.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.122.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.123.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.123.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.123.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.124.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.124.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.124.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.125.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.125.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.125.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.126.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.126.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.126.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.127.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.127.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.127.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.128.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.128.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.128.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.129.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.129.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.129.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.13.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.13.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.13.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.130.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.130.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.130.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.131.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.131.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.131.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.132.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.132.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.132.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.133.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.133.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.133.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.134.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.134.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.134.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.135.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.135.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.135.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.136.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.136.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.136.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.137.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.137.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.137.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.138.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.138.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.138.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.139.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.139.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.139.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.14.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.14.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.14.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.140.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.140.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.140.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.141.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.141.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.141.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.142.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.142.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.142.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.143.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.143.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.143.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.144.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.144.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.144.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.145.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.145.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.145.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.146.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.146.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.146.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.147.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.147.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.147.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.148.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.148.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.148.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.149.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.149.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.149.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.15.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.15.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.15.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.150.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.150.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.150.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.151.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.151.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.151.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.152.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.152.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.152.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.153.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.153.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.153.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.154.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.154.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.154.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.155.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.155.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.155.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.156.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.156.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.156.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.157.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.157.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.157.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.158.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.158.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.158.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.159.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.159.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.159.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.experts.16.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.16.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.16.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.17.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.17.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.17.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.18.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.18.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.18.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.19.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.19.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.19.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.2.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.2.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.2.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.20.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.20.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.20.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.21.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.21.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.21.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.22.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.22.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.22.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.23.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.23.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.23.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.24.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.24.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.24.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.25.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.25.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.25.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.26.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.26.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.26.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.27.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.27.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.27.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.28.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.28.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.28.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.29.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.29.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.29.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.3.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.3.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.3.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.30.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.30.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.30.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.31.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.31.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.31.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.32.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.32.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.32.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.33.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.33.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.33.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.34.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.34.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.34.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.35.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.35.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.35.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.36.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.36.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.36.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.37.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.37.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.37.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.38.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.38.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.38.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.39.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.39.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.39.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.4.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.4.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.4.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.40.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.40.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.40.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.41.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.41.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.41.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.42.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.42.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.42.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.43.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.43.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.43.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.44.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.44.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.44.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.45.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.45.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.45.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.46.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.46.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.46.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.47.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.47.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.47.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.48.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.48.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.48.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.49.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.49.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.49.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.5.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.5.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.5.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.50.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.50.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.50.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.51.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.51.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.51.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.52.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.52.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.52.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.53.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.53.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.53.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.54.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.54.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.54.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.55.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.55.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.55.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.56.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.56.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.56.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.57.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.57.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.57.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.58.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.58.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.58.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.59.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.59.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.59.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.6.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.6.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.6.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.60.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.60.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.60.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.61.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.61.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.61.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.62.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.62.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.62.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.63.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.63.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.63.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.64.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.64.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.64.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.65.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.65.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.65.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.66.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.66.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.66.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.67.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.67.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.67.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.68.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.68.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.68.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.69.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.69.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.69.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.7.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.7.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.7.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.70.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.70.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.70.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.71.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.71.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.71.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.72.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.72.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.72.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.73.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.73.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.73.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.74.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.74.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.74.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.75.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.75.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.75.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.76.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.76.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.76.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.77.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.77.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.77.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.78.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.78.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.78.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.79.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.79.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.79.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.8.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.8.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.8.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.80.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.80.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.80.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.81.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.81.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.81.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.82.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.82.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.82.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.83.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.83.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.83.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.84.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.84.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.84.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.85.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.85.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.85.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.86.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.86.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.86.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.87.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.87.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.87.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.88.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.88.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.88.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.89.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.89.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.89.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.9.down_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.9.gate_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.9.up_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.mlp.experts.90.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.90.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.90.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.91.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.91.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.91.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.92.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.92.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.92.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.93.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.93.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.93.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.94.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.94.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.94.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.95.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.95.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.95.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.96.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.96.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.96.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.97.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.97.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.97.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.98.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.98.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.98.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.99.down_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.99.gate_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.experts.99.up_proj.weight": "model-00073-of-00142.safetensors", + "model.layers.48.mlp.gate.e_score_correction_bias": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.gate.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.shared_experts.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.shared_experts.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.mlp.shared_experts.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.48.post_attention_layernorm.weight": "model-00074-of-00142.safetensors", + "model.layers.48.self_attn.k_norm.weight": "model-00072-of-00142.safetensors", + "model.layers.48.self_attn.k_proj.bias": "model-00072-of-00142.safetensors", + "model.layers.48.self_attn.k_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.self_attn.o_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.self_attn.q_norm.weight": "model-00072-of-00142.safetensors", + "model.layers.48.self_attn.q_proj.bias": "model-00072-of-00142.safetensors", + "model.layers.48.self_attn.q_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.48.self_attn.v_proj.bias": "model-00072-of-00142.safetensors", + "model.layers.48.self_attn.v_proj.weight": "model-00072-of-00142.safetensors", + "model.layers.49.input_layernorm.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.0.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.0.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.0.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.1.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.1.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.1.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.10.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.10.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.10.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.100.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.100.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.100.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.101.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.101.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.101.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.102.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.102.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.102.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.103.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.103.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.103.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.104.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.104.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.104.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.105.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.105.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.105.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.106.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.106.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.106.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.107.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.107.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.107.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.108.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.108.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.108.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.109.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.109.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.109.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.11.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.11.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.11.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.110.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.110.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.110.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.111.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.111.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.111.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.112.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.112.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.112.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.113.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.113.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.113.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.114.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.114.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.114.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.115.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.115.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.115.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.116.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.116.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.116.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.117.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.117.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.117.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.118.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.118.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.118.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.119.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.119.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.119.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.12.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.12.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.12.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.120.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.120.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.120.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.121.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.121.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.121.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.122.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.122.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.122.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.123.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.123.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.123.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.124.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.124.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.124.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.125.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.125.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.125.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.126.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.126.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.126.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.127.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.127.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.127.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.128.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.128.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.128.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.129.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.129.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.129.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.13.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.13.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.13.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.130.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.130.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.130.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.131.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.131.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.131.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.132.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.132.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.132.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.133.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.133.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.133.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.134.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.134.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.134.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.135.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.135.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.135.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.136.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.136.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.136.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.137.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.137.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.137.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.138.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.138.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.138.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.139.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.139.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.139.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.14.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.14.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.14.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.140.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.140.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.140.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.141.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.141.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.141.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.142.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.142.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.142.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.143.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.143.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.143.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.144.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.144.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.144.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.145.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.145.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.145.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.146.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.146.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.146.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.147.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.147.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.147.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.148.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.148.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.148.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.149.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.149.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.149.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.15.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.15.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.15.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.150.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.150.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.150.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.151.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.151.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.151.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.152.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.152.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.152.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.153.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.153.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.153.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.154.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.154.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.154.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.155.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.155.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.155.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.156.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.156.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.156.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.157.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.157.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.157.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.158.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.158.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.158.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.159.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.159.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.159.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.16.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.16.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.16.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.17.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.17.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.17.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.18.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.18.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.18.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.19.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.19.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.19.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.2.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.2.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.2.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.20.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.20.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.20.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.21.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.21.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.21.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.22.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.22.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.22.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.23.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.23.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.23.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.24.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.24.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.24.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.25.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.25.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.25.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.26.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.26.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.26.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.27.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.27.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.27.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.28.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.28.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.28.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.29.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.29.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.29.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.3.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.3.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.3.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.30.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.30.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.30.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.31.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.31.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.31.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.32.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.32.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.32.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.33.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.33.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.33.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.34.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.34.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.34.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.35.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.35.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.35.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.36.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.36.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.36.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.37.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.37.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.37.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.38.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.38.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.38.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.39.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.39.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.39.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.4.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.4.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.4.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.40.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.40.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.40.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.41.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.41.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.41.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.42.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.42.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.42.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.43.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.43.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.43.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.44.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.44.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.44.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.45.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.45.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.45.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.46.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.46.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.46.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.47.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.47.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.47.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.48.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.48.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.48.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.49.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.49.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.49.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.5.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.5.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.5.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.50.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.50.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.50.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.51.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.51.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.51.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.52.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.52.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.52.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.53.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.53.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.53.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.54.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.54.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.54.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.55.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.55.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.55.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.56.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.56.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.56.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.57.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.57.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.57.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.58.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.58.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.58.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.59.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.59.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.59.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.6.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.6.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.6.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.60.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.60.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.60.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.61.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.61.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.61.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.62.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.62.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.62.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.63.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.63.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.63.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.64.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.64.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.64.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.65.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.65.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.65.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.66.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.66.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.66.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.67.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.67.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.67.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.68.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.68.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.68.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.69.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.69.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.69.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.7.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.7.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.7.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.70.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.70.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.70.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.71.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.71.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.71.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.72.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.72.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.72.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.73.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.73.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.73.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.74.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.74.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.74.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.75.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.75.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.75.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.76.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.76.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.76.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.77.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.77.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.77.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.78.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.78.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.78.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.79.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.79.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.79.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.8.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.8.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.8.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.80.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.80.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.80.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.81.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.81.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.81.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.82.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.82.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.82.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.83.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.83.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.83.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.84.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.84.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.84.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.85.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.85.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.85.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.86.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.86.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.86.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.87.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.87.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.87.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.88.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.88.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.88.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.89.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.89.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.89.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.9.down_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.9.gate_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.9.up_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.mlp.experts.90.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.90.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.90.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.91.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.91.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.91.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.92.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.92.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.92.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.93.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.93.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.93.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.94.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.94.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.94.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.95.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.95.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.95.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.96.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.96.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.96.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.97.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.97.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.97.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.98.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.98.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.98.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.99.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.99.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.experts.99.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.gate.e_score_correction_bias": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.gate.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.shared_experts.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.shared_experts.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.mlp.shared_experts.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.49.post_attention_layernorm.weight": "model-00075-of-00142.safetensors", + "model.layers.49.self_attn.k_norm.weight": "model-00074-of-00142.safetensors", + "model.layers.49.self_attn.k_proj.bias": "model-00074-of-00142.safetensors", + "model.layers.49.self_attn.k_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.self_attn.o_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.self_attn.q_norm.weight": "model-00074-of-00142.safetensors", + "model.layers.49.self_attn.q_proj.bias": "model-00074-of-00142.safetensors", + "model.layers.49.self_attn.q_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.49.self_attn.v_proj.bias": "model-00074-of-00142.safetensors", + "model.layers.49.self_attn.v_proj.weight": "model-00074-of-00142.safetensors", + "model.layers.5.input_layernorm.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.0.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.0.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.0.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.1.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.1.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.1.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.10.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.10.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.10.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.100.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.100.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.100.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.101.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.101.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.101.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.102.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.102.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.102.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.103.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.103.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.103.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.104.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.104.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.104.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.105.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.105.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.105.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.106.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.106.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.106.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.107.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.107.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.107.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.108.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.108.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.108.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.109.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.109.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.109.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.11.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.11.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.11.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.110.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.110.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.110.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.111.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.111.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.111.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.112.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.112.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.112.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.113.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.113.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.113.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.114.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.114.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.114.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.115.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.115.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.115.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.116.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.116.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.116.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.117.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.117.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.117.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.118.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.118.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.118.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.119.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.119.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.119.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.12.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.12.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.12.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.120.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.120.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.120.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.121.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.121.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.121.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.122.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.122.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.122.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.123.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.123.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.123.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.124.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.124.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.124.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.125.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.125.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.125.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.126.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.126.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.126.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.127.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.127.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.127.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.128.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.128.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.128.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.129.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.129.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.129.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.13.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.13.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.13.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.130.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.130.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.130.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.131.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.131.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.131.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.132.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.132.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.132.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.133.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.133.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.133.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.134.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.134.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.134.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.135.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.135.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.135.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.136.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.136.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.136.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.137.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.137.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.137.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.138.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.138.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.138.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.139.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.139.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.139.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.14.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.14.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.14.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.140.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.140.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.140.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.141.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.141.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.141.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.142.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.142.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.142.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.143.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.143.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.143.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.144.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.144.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.144.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.145.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.145.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.145.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.146.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.146.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.146.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.147.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.147.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.147.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.148.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.148.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.148.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.149.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.149.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.149.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.15.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.15.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.15.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.150.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.150.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.150.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.151.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.151.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.151.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.152.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.152.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.152.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.153.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.153.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.153.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.154.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.154.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.154.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.155.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.155.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.155.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.156.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.156.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.156.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.157.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.157.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.157.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.158.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.158.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.158.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.159.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.159.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.159.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.experts.16.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.16.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.16.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.17.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.17.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.17.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.18.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.18.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.18.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.19.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.19.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.19.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.2.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.2.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.2.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.20.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.20.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.20.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.21.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.21.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.21.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.22.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.22.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.22.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.23.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.23.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.23.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.24.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.24.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.24.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.25.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.25.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.25.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.26.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.26.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.26.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.27.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.27.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.27.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.28.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.28.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.28.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.29.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.29.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.29.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.3.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.3.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.3.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.30.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.30.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.30.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.31.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.31.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.31.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.32.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.32.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.32.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.33.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.33.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.33.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.34.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.34.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.34.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.35.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.35.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.35.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.36.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.36.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.36.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.37.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.37.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.37.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.38.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.38.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.38.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.39.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.39.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.39.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.4.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.4.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.4.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.40.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.40.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.40.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.41.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.41.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.41.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.42.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.42.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.42.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.43.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.43.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.43.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.44.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.44.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.44.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.45.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.45.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.45.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.46.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.46.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.46.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.47.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.47.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.47.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.48.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.48.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.48.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.49.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.49.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.49.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.5.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.5.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.5.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.50.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.50.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.50.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.51.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.51.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.51.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.52.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.52.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.52.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.53.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.53.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.53.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.54.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.54.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.54.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.55.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.55.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.55.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.56.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.56.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.56.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.57.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.57.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.57.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.58.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.58.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.58.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.59.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.59.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.59.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.6.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.6.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.6.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.60.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.60.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.60.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.61.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.61.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.61.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.62.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.62.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.62.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.63.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.63.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.63.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.64.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.64.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.64.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.65.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.65.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.65.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.66.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.66.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.66.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.67.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.67.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.67.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.68.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.68.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.68.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.69.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.69.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.69.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.7.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.7.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.7.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.70.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.70.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.70.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.71.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.71.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.71.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.72.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.72.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.72.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.73.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.73.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.73.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.74.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.74.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.74.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.75.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.75.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.75.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.76.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.76.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.76.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.77.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.77.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.77.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.78.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.78.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.78.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.79.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.79.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.79.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.8.down_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.8.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.8.up_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.80.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.80.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.80.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.81.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.81.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.81.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.82.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.82.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.82.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.83.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.83.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.83.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.84.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.84.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.84.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.85.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.85.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.85.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.86.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.86.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.86.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.87.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.87.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.87.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.88.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.88.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.88.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.89.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.89.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.89.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.9.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.9.gate_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.mlp.experts.9.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.90.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.90.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.90.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.91.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.91.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.91.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.92.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.92.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.92.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.93.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.93.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.93.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.94.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.94.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.94.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.95.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.95.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.95.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.96.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.96.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.96.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.97.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.97.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.97.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.98.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.98.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.98.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.99.down_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.99.gate_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.experts.99.up_proj.weight": "model-00005-of-00142.safetensors", + "model.layers.5.mlp.gate.e_score_correction_bias": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.gate.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.shared_experts.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.shared_experts.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.mlp.shared_experts.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00006-of-00142.safetensors", + "model.layers.5.self_attn.k_norm.weight": "model-00004-of-00142.safetensors", + "model.layers.5.self_attn.k_proj.bias": "model-00004-of-00142.safetensors", + "model.layers.5.self_attn.k_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.self_attn.q_norm.weight": "model-00004-of-00142.safetensors", + "model.layers.5.self_attn.q_proj.bias": "model-00004-of-00142.safetensors", + "model.layers.5.self_attn.q_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.5.self_attn.v_proj.bias": "model-00004-of-00142.safetensors", + "model.layers.5.self_attn.v_proj.weight": "model-00004-of-00142.safetensors", + "model.layers.50.input_layernorm.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.0.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.0.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.0.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.1.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.1.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.1.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.10.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.10.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.10.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.100.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.100.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.100.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.101.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.101.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.101.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.102.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.102.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.102.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.103.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.103.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.103.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.104.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.104.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.104.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.105.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.105.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.105.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.106.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.106.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.106.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.107.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.107.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.107.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.108.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.108.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.108.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.109.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.109.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.109.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.11.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.11.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.11.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.110.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.110.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.110.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.111.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.111.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.111.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.112.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.112.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.112.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.113.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.113.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.113.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.114.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.114.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.114.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.115.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.115.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.115.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.116.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.116.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.116.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.117.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.117.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.117.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.118.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.118.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.118.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.119.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.119.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.119.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.12.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.12.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.12.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.120.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.120.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.120.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.121.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.121.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.121.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.122.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.122.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.122.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.123.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.123.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.123.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.124.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.124.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.124.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.125.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.125.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.125.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.126.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.126.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.126.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.127.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.127.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.127.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.128.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.128.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.128.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.129.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.129.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.129.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.13.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.13.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.13.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.130.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.130.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.130.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.131.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.131.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.131.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.132.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.132.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.132.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.133.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.133.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.133.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.134.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.134.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.134.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.135.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.135.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.135.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.136.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.136.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.136.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.137.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.137.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.137.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.138.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.138.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.138.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.139.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.139.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.139.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.14.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.14.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.14.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.140.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.140.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.140.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.141.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.141.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.141.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.142.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.142.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.142.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.143.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.143.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.143.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.144.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.144.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.144.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.145.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.145.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.145.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.146.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.146.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.146.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.147.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.147.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.147.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.148.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.148.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.148.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.149.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.149.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.149.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.15.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.15.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.15.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.150.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.150.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.150.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.151.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.151.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.151.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.152.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.152.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.152.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.153.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.153.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.153.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.154.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.154.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.154.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.155.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.155.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.155.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.156.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.156.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.156.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.157.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.157.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.157.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.158.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.158.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.158.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.159.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.159.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.159.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.experts.16.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.16.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.16.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.17.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.17.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.17.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.18.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.18.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.18.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.19.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.19.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.19.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.2.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.2.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.2.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.20.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.20.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.20.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.21.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.21.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.21.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.22.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.22.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.22.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.23.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.23.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.23.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.24.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.24.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.24.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.25.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.25.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.25.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.26.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.26.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.26.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.27.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.27.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.27.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.28.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.28.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.28.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.29.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.29.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.29.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.3.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.3.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.3.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.30.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.30.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.30.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.31.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.31.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.31.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.32.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.32.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.32.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.33.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.33.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.33.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.34.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.34.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.34.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.35.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.35.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.35.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.36.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.36.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.36.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.37.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.37.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.37.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.38.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.38.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.38.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.39.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.39.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.39.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.4.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.4.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.4.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.40.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.40.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.40.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.41.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.41.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.41.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.42.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.42.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.42.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.43.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.43.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.43.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.44.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.44.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.44.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.45.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.45.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.45.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.46.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.46.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.46.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.47.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.47.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.47.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.48.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.48.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.48.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.49.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.49.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.49.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.5.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.5.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.5.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.50.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.50.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.50.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.51.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.51.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.51.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.52.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.52.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.52.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.53.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.53.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.53.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.54.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.54.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.54.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.55.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.55.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.55.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.56.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.56.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.56.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.57.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.57.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.57.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.58.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.58.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.58.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.59.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.59.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.59.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.6.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.6.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.6.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.60.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.60.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.60.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.61.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.61.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.61.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.62.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.62.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.62.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.63.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.63.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.63.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.64.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.64.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.64.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.65.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.65.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.65.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.66.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.66.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.66.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.67.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.67.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.67.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.68.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.68.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.68.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.69.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.69.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.69.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.7.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.7.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.7.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.70.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.70.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.70.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.71.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.71.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.71.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.72.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.72.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.72.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.73.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.73.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.73.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.74.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.74.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.74.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.75.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.75.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.75.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.76.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.76.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.76.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.77.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.77.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.77.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.78.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.78.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.78.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.79.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.79.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.79.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.8.down_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.8.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.8.up_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.80.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.80.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.80.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.81.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.81.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.81.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.82.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.82.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.82.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.83.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.83.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.83.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.84.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.84.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.84.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.85.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.85.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.85.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.86.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.86.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.86.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.87.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.87.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.87.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.88.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.88.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.88.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.89.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.89.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.89.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.9.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.9.gate_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.mlp.experts.9.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.90.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.90.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.90.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.91.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.91.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.91.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.92.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.92.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.92.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.93.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.93.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.93.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.94.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.94.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.94.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.95.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.95.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.95.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.96.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.96.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.96.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.97.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.97.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.97.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.98.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.98.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.98.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.99.down_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.99.gate_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.experts.99.up_proj.weight": "model-00076-of-00142.safetensors", + "model.layers.50.mlp.gate.e_score_correction_bias": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.gate.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.shared_experts.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.shared_experts.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.mlp.shared_experts.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.50.post_attention_layernorm.weight": "model-00077-of-00142.safetensors", + "model.layers.50.self_attn.k_norm.weight": "model-00075-of-00142.safetensors", + "model.layers.50.self_attn.k_proj.bias": "model-00075-of-00142.safetensors", + "model.layers.50.self_attn.k_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.self_attn.o_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.self_attn.q_norm.weight": "model-00075-of-00142.safetensors", + "model.layers.50.self_attn.q_proj.bias": "model-00075-of-00142.safetensors", + "model.layers.50.self_attn.q_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.50.self_attn.v_proj.bias": "model-00075-of-00142.safetensors", + "model.layers.50.self_attn.v_proj.weight": "model-00075-of-00142.safetensors", + "model.layers.51.input_layernorm.weight": "model-00079-of-00142.safetensors", + "model.layers.51.mlp.experts.0.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.0.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.0.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.1.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.1.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.1.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.10.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.10.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.10.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.100.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.100.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.100.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.101.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.101.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.101.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.102.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.102.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.102.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.103.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.103.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.103.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.104.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.104.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.104.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.105.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.105.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.105.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.106.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.106.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.106.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.107.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.107.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.107.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.108.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.108.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.108.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.109.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.109.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.109.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.11.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.11.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.11.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.110.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.110.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.110.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.111.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.111.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.111.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.112.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.112.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.112.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.113.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.113.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.113.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.114.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.114.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.114.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.115.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.115.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.115.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.116.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.116.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.116.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.117.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.117.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.117.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.118.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.118.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.118.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.119.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.119.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.119.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.12.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.12.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.12.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.120.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.120.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.120.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.121.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.121.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.121.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.122.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.122.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.122.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.123.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.123.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.123.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.124.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.124.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.124.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.125.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.125.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.125.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.126.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.126.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.126.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.127.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.127.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.127.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.128.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.128.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.128.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.129.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.129.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.129.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.13.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.13.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.13.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.130.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.130.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.130.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.131.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.131.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.131.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.132.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.132.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.132.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.133.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.133.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.133.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.134.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.134.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.134.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.135.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.135.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.135.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.136.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.136.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.136.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.137.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.137.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.137.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.138.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.138.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.138.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.139.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.139.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.139.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.14.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.14.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.14.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.140.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.140.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.140.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.141.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.141.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.141.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.142.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.142.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.142.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.143.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.143.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.143.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.144.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.144.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.144.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.145.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.145.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.145.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.146.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.146.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.146.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.147.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.147.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.147.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.148.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.148.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.148.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.149.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.149.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.149.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.15.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.15.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.15.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.150.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.150.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.150.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.151.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.151.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.151.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.152.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.152.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.152.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.153.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.153.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.153.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.154.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.154.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.154.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.155.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.155.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.155.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.156.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.156.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.156.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.157.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.157.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.157.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.158.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.158.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.158.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.159.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.51.mlp.experts.159.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.159.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.16.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.16.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.16.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.17.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.17.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.17.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.18.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.18.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.18.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.19.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.19.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.19.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.2.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.2.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.2.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.20.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.20.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.20.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.21.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.21.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.21.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.22.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.22.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.22.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.23.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.23.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.23.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.24.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.24.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.24.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.25.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.25.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.25.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.26.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.26.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.26.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.27.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.27.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.27.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.28.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.28.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.28.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.29.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.29.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.29.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.3.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.3.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.3.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.30.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.30.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.30.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.31.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.31.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.31.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.32.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.32.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.32.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.33.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.33.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.33.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.34.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.34.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.34.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.35.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.35.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.35.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.36.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.36.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.36.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.37.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.37.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.37.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.38.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.38.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.38.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.39.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.39.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.39.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.4.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.4.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.4.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.40.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.40.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.40.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.41.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.41.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.41.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.42.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.42.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.42.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.43.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.43.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.43.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.44.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.44.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.44.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.45.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.45.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.45.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.46.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.46.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.46.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.47.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.47.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.47.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.48.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.48.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.48.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.49.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.49.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.49.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.5.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.5.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.5.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.50.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.50.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.50.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.51.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.51.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.51.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.52.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.52.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.52.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.53.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.53.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.53.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.54.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.54.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.54.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.55.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.55.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.55.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.56.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.56.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.56.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.57.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.57.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.57.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.58.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.58.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.58.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.59.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.59.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.59.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.6.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.6.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.6.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.60.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.60.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.60.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.61.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.61.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.61.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.62.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.62.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.62.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.63.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.63.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.63.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.64.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.64.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.64.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.65.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.65.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.65.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.66.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.66.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.66.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.67.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.67.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.67.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.68.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.68.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.68.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.69.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.69.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.69.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.7.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.7.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.7.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.70.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.70.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.70.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.71.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.71.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.71.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.72.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.72.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.72.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.73.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.73.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.73.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.74.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.74.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.74.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.75.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.75.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.75.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.76.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.76.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.76.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.77.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.77.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.77.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.78.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.78.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.78.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.79.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.79.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.79.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.8.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.8.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.8.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.80.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.80.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.80.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.81.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.81.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.81.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.82.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.82.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.82.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.83.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.83.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.83.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.84.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.84.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.84.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.85.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.85.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.85.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.86.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.86.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.86.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.87.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.87.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.87.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.88.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.88.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.88.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.89.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.89.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.89.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.9.down_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.9.gate_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.9.up_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.mlp.experts.90.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.90.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.90.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.91.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.91.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.91.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.92.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.92.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.92.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.93.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.93.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.93.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.94.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.94.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.94.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.95.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.95.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.95.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.96.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.96.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.96.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.97.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.97.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.97.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.98.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.98.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.98.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.99.down_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.99.gate_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.experts.99.up_proj.weight": "model-00078-of-00142.safetensors", + "model.layers.51.mlp.gate.e_score_correction_bias": "model-00079-of-00142.safetensors", + "model.layers.51.mlp.gate.weight": "model-00079-of-00142.safetensors", + "model.layers.51.mlp.shared_experts.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.51.mlp.shared_experts.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.51.mlp.shared_experts.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.51.post_attention_layernorm.weight": "model-00079-of-00142.safetensors", + "model.layers.51.self_attn.k_norm.weight": "model-00077-of-00142.safetensors", + "model.layers.51.self_attn.k_proj.bias": "model-00077-of-00142.safetensors", + "model.layers.51.self_attn.k_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.self_attn.o_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.self_attn.q_norm.weight": "model-00077-of-00142.safetensors", + "model.layers.51.self_attn.q_proj.bias": "model-00077-of-00142.safetensors", + "model.layers.51.self_attn.q_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.51.self_attn.v_proj.bias": "model-00077-of-00142.safetensors", + "model.layers.51.self_attn.v_proj.weight": "model-00077-of-00142.safetensors", + "model.layers.52.input_layernorm.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.0.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.0.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.0.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.1.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.1.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.1.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.10.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.10.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.10.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.100.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.100.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.100.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.101.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.101.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.101.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.102.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.102.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.102.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.103.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.103.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.103.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.104.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.104.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.104.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.105.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.105.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.105.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.106.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.106.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.106.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.107.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.107.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.107.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.108.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.108.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.108.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.109.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.109.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.109.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.11.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.11.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.11.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.110.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.110.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.110.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.111.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.111.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.111.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.112.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.112.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.112.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.113.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.113.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.113.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.114.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.114.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.114.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.115.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.115.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.115.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.116.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.116.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.116.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.117.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.117.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.117.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.118.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.118.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.118.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.119.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.119.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.119.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.12.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.12.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.12.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.120.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.120.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.120.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.121.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.121.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.121.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.122.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.122.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.122.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.123.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.123.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.123.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.124.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.124.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.124.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.125.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.125.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.125.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.126.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.126.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.126.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.127.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.127.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.127.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.128.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.128.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.128.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.129.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.129.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.129.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.13.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.13.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.13.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.130.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.130.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.130.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.131.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.131.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.131.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.132.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.132.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.132.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.133.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.133.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.133.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.134.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.134.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.134.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.135.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.135.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.135.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.136.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.136.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.136.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.137.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.137.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.137.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.138.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.138.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.138.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.139.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.139.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.139.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.14.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.14.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.14.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.140.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.140.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.140.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.141.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.141.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.141.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.142.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.142.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.142.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.143.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.143.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.143.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.144.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.144.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.144.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.145.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.145.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.145.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.146.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.146.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.146.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.147.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.147.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.147.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.148.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.148.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.148.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.149.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.149.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.149.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.15.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.15.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.15.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.150.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.150.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.150.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.151.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.151.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.151.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.152.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.152.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.152.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.153.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.153.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.153.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.154.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.154.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.154.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.155.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.155.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.155.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.156.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.156.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.156.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.157.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.157.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.157.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.158.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.158.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.158.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.159.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.159.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.159.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.16.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.16.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.16.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.17.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.17.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.17.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.18.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.18.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.18.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.19.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.19.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.19.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.2.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.2.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.2.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.20.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.20.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.20.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.21.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.21.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.21.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.22.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.22.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.22.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.23.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.23.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.23.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.24.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.24.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.24.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.25.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.25.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.25.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.26.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.26.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.26.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.27.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.27.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.27.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.28.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.28.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.28.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.29.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.29.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.29.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.3.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.3.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.3.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.30.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.30.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.30.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.31.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.31.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.31.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.32.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.32.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.32.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.33.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.33.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.33.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.34.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.34.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.34.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.35.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.35.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.35.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.36.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.36.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.36.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.37.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.37.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.37.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.38.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.38.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.38.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.39.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.39.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.39.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.4.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.4.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.4.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.40.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.40.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.40.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.41.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.41.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.41.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.42.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.42.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.42.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.43.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.43.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.43.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.44.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.44.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.44.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.45.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.45.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.45.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.46.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.46.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.46.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.47.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.47.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.47.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.48.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.48.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.48.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.49.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.49.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.49.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.5.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.5.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.5.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.50.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.50.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.50.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.51.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.51.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.51.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.52.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.52.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.52.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.53.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.53.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.53.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.54.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.54.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.54.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.55.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.55.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.55.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.56.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.56.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.56.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.57.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.57.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.57.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.58.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.58.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.58.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.59.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.59.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.59.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.6.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.6.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.6.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.60.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.60.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.60.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.61.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.61.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.61.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.62.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.62.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.62.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.63.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.63.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.63.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.64.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.64.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.64.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.65.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.65.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.65.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.66.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.66.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.66.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.67.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.67.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.67.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.68.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.68.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.68.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.69.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.69.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.69.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.7.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.7.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.7.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.70.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.70.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.70.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.71.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.71.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.71.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.72.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.72.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.72.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.73.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.73.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.73.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.74.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.74.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.74.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.75.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.75.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.75.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.76.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.76.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.76.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.77.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.77.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.77.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.78.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.78.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.78.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.79.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.79.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.79.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.8.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.8.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.8.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.80.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.80.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.80.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.81.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.81.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.81.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.82.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.82.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.82.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.83.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.83.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.83.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.84.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.84.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.84.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.85.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.85.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.85.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.86.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.86.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.86.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.87.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.87.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.87.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.88.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.88.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.88.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.89.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.89.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.89.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.9.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.9.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.9.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.90.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.90.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.90.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.91.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.91.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.91.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.92.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.92.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.92.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.93.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.93.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.93.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.94.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.94.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.94.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.95.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.95.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.95.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.96.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.96.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.96.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.97.down_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.97.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.97.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.98.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.98.gate_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.98.up_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.mlp.experts.99.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.99.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.experts.99.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.gate.e_score_correction_bias": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.gate.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.shared_experts.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.shared_experts.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.mlp.shared_experts.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.52.post_attention_layernorm.weight": "model-00080-of-00142.safetensors", + "model.layers.52.self_attn.k_norm.weight": "model-00079-of-00142.safetensors", + "model.layers.52.self_attn.k_proj.bias": "model-00079-of-00142.safetensors", + "model.layers.52.self_attn.k_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.self_attn.o_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.self_attn.q_norm.weight": "model-00079-of-00142.safetensors", + "model.layers.52.self_attn.q_proj.bias": "model-00079-of-00142.safetensors", + "model.layers.52.self_attn.q_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.52.self_attn.v_proj.bias": "model-00079-of-00142.safetensors", + "model.layers.52.self_attn.v_proj.weight": "model-00079-of-00142.safetensors", + "model.layers.53.input_layernorm.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.0.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.0.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.0.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.1.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.1.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.1.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.10.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.10.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.10.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.100.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.100.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.100.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.101.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.101.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.101.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.102.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.102.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.102.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.103.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.103.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.103.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.104.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.104.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.104.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.105.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.105.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.105.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.106.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.106.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.106.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.107.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.107.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.107.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.108.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.108.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.108.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.109.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.109.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.109.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.11.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.11.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.11.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.110.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.110.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.110.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.111.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.111.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.111.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.112.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.112.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.112.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.113.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.113.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.113.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.114.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.114.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.114.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.115.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.115.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.115.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.116.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.116.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.116.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.117.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.117.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.117.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.118.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.118.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.118.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.119.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.119.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.119.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.12.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.12.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.12.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.120.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.120.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.120.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.121.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.121.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.121.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.122.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.122.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.122.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.123.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.123.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.123.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.124.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.124.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.124.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.125.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.125.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.125.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.126.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.126.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.126.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.127.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.127.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.127.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.128.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.128.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.128.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.129.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.129.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.129.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.13.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.13.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.13.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.130.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.130.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.130.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.131.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.131.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.131.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.132.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.132.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.132.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.133.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.133.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.133.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.134.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.134.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.134.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.135.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.135.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.135.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.136.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.136.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.136.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.137.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.137.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.137.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.138.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.138.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.138.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.139.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.139.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.139.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.14.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.14.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.14.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.140.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.140.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.140.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.141.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.141.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.141.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.142.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.142.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.142.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.143.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.143.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.143.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.144.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.144.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.144.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.145.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.145.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.145.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.146.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.146.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.146.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.147.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.147.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.147.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.148.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.148.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.148.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.149.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.149.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.149.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.15.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.15.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.15.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.150.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.150.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.150.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.151.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.151.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.151.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.152.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.152.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.152.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.153.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.153.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.153.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.154.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.154.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.154.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.155.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.155.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.155.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.156.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.156.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.156.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.157.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.157.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.157.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.158.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.158.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.158.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.159.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.159.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.159.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.experts.16.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.16.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.16.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.17.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.17.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.17.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.18.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.18.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.18.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.19.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.19.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.19.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.2.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.2.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.2.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.20.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.20.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.20.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.21.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.21.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.21.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.22.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.22.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.22.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.23.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.23.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.23.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.24.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.24.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.24.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.25.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.25.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.25.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.26.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.26.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.26.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.27.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.27.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.27.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.28.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.28.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.28.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.29.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.29.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.29.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.3.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.3.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.3.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.30.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.30.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.30.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.31.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.31.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.31.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.32.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.32.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.32.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.33.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.33.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.33.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.34.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.34.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.34.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.35.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.35.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.35.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.36.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.36.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.36.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.37.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.37.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.37.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.38.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.38.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.38.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.39.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.39.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.39.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.4.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.4.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.4.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.40.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.40.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.40.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.41.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.41.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.41.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.42.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.42.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.42.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.43.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.43.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.43.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.44.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.44.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.44.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.45.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.45.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.45.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.46.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.46.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.46.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.47.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.47.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.47.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.48.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.48.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.48.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.49.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.49.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.49.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.5.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.5.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.5.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.50.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.50.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.50.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.51.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.51.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.51.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.52.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.52.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.52.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.53.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.53.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.53.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.54.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.54.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.54.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.55.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.55.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.55.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.56.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.56.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.56.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.57.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.57.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.57.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.58.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.58.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.58.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.59.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.59.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.59.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.6.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.6.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.6.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.60.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.60.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.60.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.61.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.61.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.61.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.62.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.62.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.62.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.63.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.63.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.63.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.64.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.64.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.64.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.65.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.65.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.65.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.66.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.66.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.66.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.67.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.67.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.67.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.68.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.68.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.68.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.69.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.69.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.69.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.7.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.7.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.7.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.70.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.70.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.70.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.71.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.71.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.71.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.72.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.72.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.72.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.73.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.73.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.73.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.74.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.74.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.74.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.75.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.75.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.75.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.76.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.76.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.76.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.77.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.77.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.77.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.78.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.78.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.78.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.79.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.79.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.79.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.8.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.8.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.8.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.80.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.80.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.80.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.81.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.81.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.81.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.82.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.82.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.82.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.83.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.83.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.83.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.84.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.84.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.84.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.85.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.85.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.85.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.86.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.86.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.86.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.87.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.87.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.87.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.88.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.88.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.88.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.89.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.89.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.89.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.9.down_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.9.gate_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.9.up_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.mlp.experts.90.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.90.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.90.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.91.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.91.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.91.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.92.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.92.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.92.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.93.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.93.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.93.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.94.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.94.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.94.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.95.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.95.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.95.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.96.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.96.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.96.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.97.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.97.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.97.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.98.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.98.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.98.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.99.down_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.99.gate_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.experts.99.up_proj.weight": "model-00081-of-00142.safetensors", + "model.layers.53.mlp.gate.e_score_correction_bias": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.gate.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.shared_experts.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.shared_experts.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.mlp.shared_experts.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.53.post_attention_layernorm.weight": "model-00082-of-00142.safetensors", + "model.layers.53.self_attn.k_norm.weight": "model-00080-of-00142.safetensors", + "model.layers.53.self_attn.k_proj.bias": "model-00080-of-00142.safetensors", + "model.layers.53.self_attn.k_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.self_attn.o_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.self_attn.q_norm.weight": "model-00080-of-00142.safetensors", + "model.layers.53.self_attn.q_proj.bias": "model-00080-of-00142.safetensors", + "model.layers.53.self_attn.q_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.53.self_attn.v_proj.bias": "model-00080-of-00142.safetensors", + "model.layers.53.self_attn.v_proj.weight": "model-00080-of-00142.safetensors", + "model.layers.54.input_layernorm.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.0.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.0.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.0.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.1.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.1.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.1.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.10.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.10.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.10.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.100.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.100.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.100.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.101.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.101.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.101.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.102.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.102.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.102.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.103.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.103.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.103.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.104.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.104.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.104.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.105.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.105.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.105.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.106.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.106.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.106.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.107.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.107.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.107.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.108.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.108.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.108.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.109.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.109.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.109.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.11.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.11.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.11.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.110.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.110.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.110.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.111.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.111.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.111.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.112.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.112.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.112.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.113.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.113.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.113.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.114.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.114.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.114.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.115.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.115.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.115.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.116.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.116.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.116.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.117.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.117.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.117.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.118.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.118.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.118.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.119.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.119.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.119.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.12.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.12.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.12.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.120.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.120.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.120.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.121.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.121.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.121.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.122.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.122.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.122.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.123.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.123.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.123.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.124.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.124.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.124.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.125.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.125.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.125.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.126.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.126.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.126.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.127.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.127.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.127.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.128.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.128.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.128.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.129.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.129.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.129.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.13.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.13.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.13.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.130.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.130.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.130.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.131.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.131.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.131.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.132.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.132.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.132.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.133.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.133.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.133.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.134.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.134.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.134.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.135.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.135.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.135.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.136.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.136.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.136.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.137.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.137.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.137.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.138.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.138.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.138.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.139.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.139.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.139.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.14.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.14.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.14.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.140.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.140.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.140.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.141.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.141.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.141.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.142.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.142.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.142.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.143.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.143.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.143.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.144.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.144.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.144.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.145.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.145.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.145.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.146.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.146.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.146.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.147.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.147.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.147.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.148.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.148.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.148.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.149.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.149.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.149.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.15.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.15.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.15.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.150.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.150.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.150.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.151.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.151.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.151.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.152.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.152.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.152.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.153.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.153.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.153.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.154.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.154.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.154.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.155.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.155.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.155.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.156.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.156.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.156.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.157.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.157.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.157.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.158.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.158.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.158.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.159.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.159.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.159.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.16.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.16.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.16.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.17.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.17.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.17.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.18.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.18.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.18.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.19.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.19.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.19.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.2.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.2.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.2.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.20.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.20.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.20.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.21.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.21.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.21.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.22.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.22.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.22.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.23.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.23.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.23.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.24.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.24.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.24.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.25.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.25.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.25.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.26.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.26.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.26.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.27.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.27.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.27.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.28.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.28.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.28.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.29.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.29.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.29.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.3.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.3.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.3.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.30.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.30.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.30.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.31.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.31.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.31.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.32.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.32.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.32.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.33.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.33.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.33.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.34.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.34.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.34.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.35.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.35.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.35.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.36.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.36.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.36.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.37.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.37.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.37.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.38.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.38.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.38.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.39.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.39.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.39.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.4.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.4.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.4.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.40.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.40.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.40.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.41.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.41.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.41.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.42.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.42.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.42.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.43.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.43.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.43.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.44.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.44.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.44.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.45.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.45.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.45.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.46.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.46.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.46.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.47.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.47.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.47.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.48.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.48.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.48.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.49.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.49.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.49.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.5.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.5.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.5.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.50.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.50.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.50.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.51.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.51.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.51.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.52.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.52.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.52.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.53.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.53.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.53.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.54.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.54.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.54.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.55.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.55.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.55.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.56.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.56.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.56.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.57.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.57.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.57.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.58.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.58.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.58.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.59.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.59.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.59.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.6.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.6.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.6.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.60.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.60.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.60.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.61.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.61.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.61.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.62.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.62.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.62.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.63.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.63.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.63.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.64.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.64.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.64.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.65.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.65.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.65.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.66.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.66.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.66.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.67.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.67.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.67.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.68.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.68.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.68.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.69.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.69.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.69.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.7.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.7.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.7.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.70.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.70.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.70.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.71.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.71.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.71.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.72.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.72.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.72.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.73.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.73.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.73.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.74.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.74.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.74.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.75.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.75.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.75.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.76.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.76.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.76.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.77.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.77.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.77.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.78.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.78.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.78.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.79.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.79.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.79.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.8.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.8.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.8.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.80.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.80.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.80.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.81.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.81.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.81.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.82.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.82.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.82.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.83.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.83.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.83.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.84.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.84.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.84.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.85.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.85.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.85.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.86.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.86.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.86.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.87.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.87.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.87.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.88.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.88.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.88.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.89.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.89.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.89.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.9.down_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.9.gate_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.9.up_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.mlp.experts.90.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.90.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.90.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.91.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.91.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.91.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.92.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.92.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.92.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.93.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.93.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.93.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.94.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.94.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.94.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.95.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.95.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.95.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.96.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.96.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.96.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.97.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.97.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.97.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.98.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.98.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.98.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.99.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.99.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.experts.99.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.gate.e_score_correction_bias": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.gate.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.shared_experts.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.shared_experts.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.mlp.shared_experts.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.54.post_attention_layernorm.weight": "model-00083-of-00142.safetensors", + "model.layers.54.self_attn.k_norm.weight": "model-00082-of-00142.safetensors", + "model.layers.54.self_attn.k_proj.bias": "model-00082-of-00142.safetensors", + "model.layers.54.self_attn.k_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.self_attn.o_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.self_attn.q_norm.weight": "model-00082-of-00142.safetensors", + "model.layers.54.self_attn.q_proj.bias": "model-00082-of-00142.safetensors", + "model.layers.54.self_attn.q_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.54.self_attn.v_proj.bias": "model-00082-of-00142.safetensors", + "model.layers.54.self_attn.v_proj.weight": "model-00082-of-00142.safetensors", + "model.layers.55.input_layernorm.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.0.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.0.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.0.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.1.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.1.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.1.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.10.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.10.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.10.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.100.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.100.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.100.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.101.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.101.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.101.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.102.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.102.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.102.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.103.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.103.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.103.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.104.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.104.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.104.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.105.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.105.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.105.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.106.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.106.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.106.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.107.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.107.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.107.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.108.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.108.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.108.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.109.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.109.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.109.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.11.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.11.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.11.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.110.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.110.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.110.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.111.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.111.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.111.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.112.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.112.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.112.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.113.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.113.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.113.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.114.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.114.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.114.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.115.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.115.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.115.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.116.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.116.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.116.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.117.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.117.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.117.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.118.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.118.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.118.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.119.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.119.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.119.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.12.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.12.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.12.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.120.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.120.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.120.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.121.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.121.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.121.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.122.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.122.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.122.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.123.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.123.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.123.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.124.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.124.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.124.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.125.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.125.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.125.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.126.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.126.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.126.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.127.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.127.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.127.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.128.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.128.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.128.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.129.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.129.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.129.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.13.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.13.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.13.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.130.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.130.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.130.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.131.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.131.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.131.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.132.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.132.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.132.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.133.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.133.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.133.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.134.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.134.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.134.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.135.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.135.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.135.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.136.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.136.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.136.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.137.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.137.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.137.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.138.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.138.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.138.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.139.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.139.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.139.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.14.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.14.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.14.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.140.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.140.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.140.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.141.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.141.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.141.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.142.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.142.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.142.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.143.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.143.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.143.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.144.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.144.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.144.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.145.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.145.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.145.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.146.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.146.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.146.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.147.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.147.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.147.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.148.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.148.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.148.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.149.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.149.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.149.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.15.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.15.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.15.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.150.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.150.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.150.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.151.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.151.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.151.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.152.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.152.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.152.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.153.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.153.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.153.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.154.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.154.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.154.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.155.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.155.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.155.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.156.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.156.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.156.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.157.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.157.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.157.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.158.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.158.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.158.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.159.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.159.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.159.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.experts.16.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.16.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.16.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.17.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.17.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.17.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.18.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.18.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.18.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.19.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.19.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.19.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.2.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.2.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.2.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.20.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.20.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.20.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.21.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.21.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.21.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.22.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.22.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.22.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.23.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.23.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.23.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.24.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.24.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.24.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.25.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.25.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.25.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.26.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.26.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.26.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.27.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.27.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.27.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.28.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.28.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.28.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.29.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.29.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.29.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.3.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.3.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.3.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.30.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.30.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.30.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.31.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.31.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.31.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.32.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.32.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.32.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.33.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.33.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.33.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.34.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.34.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.34.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.35.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.35.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.35.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.36.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.36.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.36.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.37.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.37.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.37.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.38.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.38.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.38.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.39.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.39.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.39.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.4.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.4.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.4.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.40.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.40.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.40.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.41.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.41.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.41.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.42.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.42.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.42.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.43.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.43.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.43.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.44.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.44.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.44.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.45.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.45.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.45.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.46.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.46.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.46.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.47.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.47.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.47.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.48.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.48.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.48.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.49.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.49.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.49.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.5.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.5.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.5.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.50.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.50.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.50.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.51.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.51.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.51.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.52.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.52.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.52.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.53.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.53.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.53.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.54.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.54.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.54.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.55.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.55.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.55.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.56.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.56.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.56.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.57.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.57.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.57.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.58.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.58.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.58.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.59.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.59.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.59.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.6.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.6.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.6.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.60.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.60.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.60.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.61.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.61.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.61.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.62.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.62.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.62.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.63.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.63.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.63.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.64.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.64.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.64.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.65.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.65.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.65.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.66.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.66.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.66.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.67.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.67.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.67.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.68.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.68.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.68.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.69.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.69.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.69.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.7.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.7.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.7.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.70.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.70.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.70.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.71.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.71.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.71.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.72.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.72.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.72.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.73.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.73.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.73.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.74.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.74.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.74.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.75.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.75.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.75.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.76.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.76.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.76.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.77.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.77.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.77.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.78.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.78.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.78.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.79.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.79.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.79.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.8.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.8.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.8.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.80.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.80.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.80.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.81.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.81.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.81.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.82.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.82.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.82.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.83.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.83.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.83.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.84.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.84.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.84.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.85.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.85.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.85.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.86.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.86.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.86.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.87.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.87.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.87.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.88.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.88.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.88.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.89.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.89.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.89.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.9.down_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.9.gate_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.9.up_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.mlp.experts.90.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.90.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.90.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.91.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.91.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.91.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.92.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.92.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.92.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.93.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.93.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.93.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.94.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.94.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.94.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.95.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.95.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.95.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.96.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.96.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.96.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.97.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.97.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.97.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.98.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.98.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.98.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.99.down_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.99.gate_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.experts.99.up_proj.weight": "model-00084-of-00142.safetensors", + "model.layers.55.mlp.gate.e_score_correction_bias": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.gate.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.shared_experts.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.shared_experts.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.mlp.shared_experts.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.55.post_attention_layernorm.weight": "model-00085-of-00142.safetensors", + "model.layers.55.self_attn.k_norm.weight": "model-00083-of-00142.safetensors", + "model.layers.55.self_attn.k_proj.bias": "model-00083-of-00142.safetensors", + "model.layers.55.self_attn.k_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.self_attn.o_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.self_attn.q_norm.weight": "model-00083-of-00142.safetensors", + "model.layers.55.self_attn.q_proj.bias": "model-00083-of-00142.safetensors", + "model.layers.55.self_attn.q_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.55.self_attn.v_proj.bias": "model-00083-of-00142.safetensors", + "model.layers.55.self_attn.v_proj.weight": "model-00083-of-00142.safetensors", + "model.layers.56.input_layernorm.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.0.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.0.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.0.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.1.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.1.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.1.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.10.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.10.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.10.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.100.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.100.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.100.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.101.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.101.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.101.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.102.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.102.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.102.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.103.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.103.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.103.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.104.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.104.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.104.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.105.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.105.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.105.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.106.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.106.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.106.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.107.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.107.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.107.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.108.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.108.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.108.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.109.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.109.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.109.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.11.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.11.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.11.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.110.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.110.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.110.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.111.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.111.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.111.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.112.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.112.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.112.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.113.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.113.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.113.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.114.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.114.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.114.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.115.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.115.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.115.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.116.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.116.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.116.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.117.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.117.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.117.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.118.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.118.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.118.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.119.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.119.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.119.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.12.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.12.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.12.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.120.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.120.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.120.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.121.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.121.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.121.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.122.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.122.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.122.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.123.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.123.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.123.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.124.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.124.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.124.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.125.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.125.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.125.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.126.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.126.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.126.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.127.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.127.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.127.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.128.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.128.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.128.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.129.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.129.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.129.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.13.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.13.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.13.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.130.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.130.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.130.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.131.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.131.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.131.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.132.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.132.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.132.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.133.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.133.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.133.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.134.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.134.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.134.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.135.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.135.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.135.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.136.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.136.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.136.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.137.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.137.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.137.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.138.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.138.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.138.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.139.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.139.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.139.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.14.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.14.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.14.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.140.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.140.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.140.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.141.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.141.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.141.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.142.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.142.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.142.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.143.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.143.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.143.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.144.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.144.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.144.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.145.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.145.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.145.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.146.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.146.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.146.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.147.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.147.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.147.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.148.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.148.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.148.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.149.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.149.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.149.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.15.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.15.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.15.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.150.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.150.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.150.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.151.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.151.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.151.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.152.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.152.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.152.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.153.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.153.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.153.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.154.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.154.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.154.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.155.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.155.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.155.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.156.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.156.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.156.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.157.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.157.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.157.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.158.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.158.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.158.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.159.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.159.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.159.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.16.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.16.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.16.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.17.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.17.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.17.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.18.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.18.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.18.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.19.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.19.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.19.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.2.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.2.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.2.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.20.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.20.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.20.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.21.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.21.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.21.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.22.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.22.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.22.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.23.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.23.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.23.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.24.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.24.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.24.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.25.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.25.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.25.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.26.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.26.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.26.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.27.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.27.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.27.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.28.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.28.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.28.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.29.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.29.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.29.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.3.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.3.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.3.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.30.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.30.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.30.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.31.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.31.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.31.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.32.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.32.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.32.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.33.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.33.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.33.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.34.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.34.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.34.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.35.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.35.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.35.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.36.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.36.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.36.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.37.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.37.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.37.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.38.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.38.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.38.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.39.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.39.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.39.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.4.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.4.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.4.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.40.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.40.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.40.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.41.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.41.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.41.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.42.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.42.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.42.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.43.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.43.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.43.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.44.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.44.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.44.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.45.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.45.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.45.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.46.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.46.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.46.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.47.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.47.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.47.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.48.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.48.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.48.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.49.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.49.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.49.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.5.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.5.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.5.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.50.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.50.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.50.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.51.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.51.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.51.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.52.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.52.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.52.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.53.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.53.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.53.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.54.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.54.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.54.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.55.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.55.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.55.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.56.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.56.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.56.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.57.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.57.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.57.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.58.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.58.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.58.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.59.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.59.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.59.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.6.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.6.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.6.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.60.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.60.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.60.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.61.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.61.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.61.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.62.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.62.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.62.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.63.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.63.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.63.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.64.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.64.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.64.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.65.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.65.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.65.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.66.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.66.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.66.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.67.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.67.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.67.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.68.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.68.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.68.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.69.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.69.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.69.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.7.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.7.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.7.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.70.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.70.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.70.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.71.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.71.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.71.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.72.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.72.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.72.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.73.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.73.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.73.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.74.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.74.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.74.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.75.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.75.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.75.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.76.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.76.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.76.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.77.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.77.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.77.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.78.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.78.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.78.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.79.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.79.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.79.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.8.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.8.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.8.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.80.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.80.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.80.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.81.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.81.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.81.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.82.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.82.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.82.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.83.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.83.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.83.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.84.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.84.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.84.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.85.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.85.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.85.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.86.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.86.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.86.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.87.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.87.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.87.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.88.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.88.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.88.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.89.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.89.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.89.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.9.down_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.9.gate_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.9.up_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.mlp.experts.90.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.90.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.90.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.91.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.91.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.91.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.92.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.92.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.92.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.93.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.93.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.93.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.94.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.94.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.94.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.95.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.95.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.95.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.96.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.96.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.96.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.97.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.97.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.97.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.98.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.98.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.98.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.99.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.99.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.experts.99.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.gate.e_score_correction_bias": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.gate.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.shared_experts.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.shared_experts.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.mlp.shared_experts.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.56.post_attention_layernorm.weight": "model-00086-of-00142.safetensors", + "model.layers.56.self_attn.k_norm.weight": "model-00085-of-00142.safetensors", + "model.layers.56.self_attn.k_proj.bias": "model-00085-of-00142.safetensors", + "model.layers.56.self_attn.k_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.self_attn.o_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.self_attn.q_norm.weight": "model-00085-of-00142.safetensors", + "model.layers.56.self_attn.q_proj.bias": "model-00085-of-00142.safetensors", + "model.layers.56.self_attn.q_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.56.self_attn.v_proj.bias": "model-00085-of-00142.safetensors", + "model.layers.56.self_attn.v_proj.weight": "model-00085-of-00142.safetensors", + "model.layers.57.input_layernorm.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.0.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.mlp.experts.0.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.mlp.experts.0.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.mlp.experts.1.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.mlp.experts.1.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.mlp.experts.1.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.mlp.experts.10.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.10.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.10.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.100.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.100.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.100.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.101.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.101.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.101.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.102.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.102.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.102.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.103.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.103.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.103.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.104.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.104.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.104.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.105.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.105.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.105.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.106.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.106.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.106.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.107.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.107.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.107.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.108.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.108.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.108.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.109.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.109.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.109.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.11.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.11.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.11.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.110.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.110.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.110.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.111.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.111.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.111.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.112.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.112.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.112.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.113.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.113.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.113.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.114.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.114.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.114.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.115.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.115.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.115.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.116.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.116.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.116.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.117.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.117.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.117.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.118.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.118.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.118.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.119.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.119.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.119.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.12.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.12.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.12.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.120.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.120.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.120.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.121.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.121.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.121.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.122.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.122.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.122.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.123.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.123.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.123.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.124.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.124.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.124.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.125.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.125.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.125.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.126.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.126.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.126.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.127.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.127.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.127.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.128.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.128.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.128.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.129.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.129.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.129.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.13.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.13.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.13.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.130.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.130.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.130.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.131.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.131.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.131.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.132.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.132.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.132.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.133.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.133.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.133.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.134.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.134.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.134.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.135.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.135.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.135.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.136.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.136.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.136.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.137.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.137.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.137.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.138.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.138.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.138.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.139.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.139.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.139.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.14.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.14.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.14.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.140.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.140.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.140.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.141.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.141.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.141.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.142.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.142.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.142.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.143.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.143.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.143.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.144.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.144.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.144.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.145.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.145.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.145.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.146.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.146.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.146.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.147.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.147.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.147.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.148.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.148.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.148.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.149.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.149.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.149.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.15.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.15.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.15.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.150.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.150.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.150.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.151.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.151.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.151.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.152.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.152.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.152.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.153.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.153.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.153.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.154.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.154.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.154.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.155.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.155.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.155.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.156.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.156.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.156.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.157.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.157.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.157.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.158.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.158.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.158.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.159.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.159.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.159.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.experts.16.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.16.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.16.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.17.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.17.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.17.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.18.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.18.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.18.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.19.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.19.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.19.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.2.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.mlp.experts.2.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.mlp.experts.2.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.mlp.experts.20.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.20.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.20.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.21.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.21.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.21.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.22.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.22.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.22.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.23.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.23.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.23.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.24.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.24.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.24.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.25.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.25.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.25.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.26.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.26.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.26.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.27.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.27.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.27.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.28.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.28.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.28.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.29.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.29.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.29.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.3.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.mlp.experts.3.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.mlp.experts.3.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.mlp.experts.30.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.30.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.30.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.31.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.31.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.31.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.32.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.32.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.32.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.33.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.33.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.33.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.34.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.34.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.34.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.35.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.35.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.35.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.36.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.36.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.36.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.37.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.37.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.37.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.38.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.38.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.38.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.39.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.39.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.39.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.4.down_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.mlp.experts.4.gate_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.mlp.experts.4.up_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.mlp.experts.40.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.40.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.40.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.41.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.41.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.41.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.42.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.42.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.42.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.43.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.43.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.43.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.44.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.44.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.44.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.45.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.45.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.45.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.46.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.46.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.46.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.47.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.47.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.47.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.48.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.48.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.48.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.49.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.49.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.49.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.5.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.5.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.5.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.50.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.50.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.50.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.51.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.51.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.51.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.52.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.52.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.52.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.53.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.53.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.53.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.54.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.54.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.54.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.55.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.55.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.55.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.56.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.56.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.56.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.57.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.57.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.57.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.58.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.58.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.58.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.59.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.59.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.59.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.6.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.6.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.6.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.60.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.60.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.60.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.61.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.61.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.61.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.62.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.62.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.62.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.63.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.63.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.63.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.64.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.64.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.64.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.65.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.65.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.65.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.66.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.66.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.66.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.67.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.67.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.67.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.68.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.68.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.68.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.69.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.69.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.69.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.7.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.7.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.7.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.70.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.70.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.70.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.71.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.71.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.71.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.72.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.72.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.72.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.73.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.73.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.73.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.74.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.74.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.74.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.75.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.75.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.75.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.76.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.76.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.76.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.77.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.77.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.77.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.78.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.78.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.78.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.79.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.79.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.79.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.8.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.8.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.8.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.80.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.80.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.80.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.81.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.81.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.81.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.82.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.82.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.82.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.83.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.83.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.83.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.84.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.84.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.84.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.85.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.85.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.85.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.86.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.86.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.86.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.87.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.87.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.87.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.88.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.88.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.88.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.89.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.89.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.89.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.9.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.9.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.9.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.90.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.90.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.90.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.91.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.91.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.91.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.92.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.92.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.92.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.93.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.93.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.93.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.94.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.94.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.94.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.95.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.95.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.95.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.96.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.96.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.96.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.97.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.97.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.97.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.98.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.98.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.98.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.99.down_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.99.gate_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.experts.99.up_proj.weight": "model-00087-of-00142.safetensors", + "model.layers.57.mlp.gate.e_score_correction_bias": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.gate.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.shared_experts.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.shared_experts.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.mlp.shared_experts.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.57.post_attention_layernorm.weight": "model-00088-of-00142.safetensors", + "model.layers.57.self_attn.k_norm.weight": "model-00086-of-00142.safetensors", + "model.layers.57.self_attn.k_proj.bias": "model-00086-of-00142.safetensors", + "model.layers.57.self_attn.k_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.self_attn.o_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.self_attn.q_norm.weight": "model-00086-of-00142.safetensors", + "model.layers.57.self_attn.q_proj.bias": "model-00086-of-00142.safetensors", + "model.layers.57.self_attn.q_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.57.self_attn.v_proj.bias": "model-00086-of-00142.safetensors", + "model.layers.57.self_attn.v_proj.weight": "model-00086-of-00142.safetensors", + "model.layers.58.input_layernorm.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.experts.0.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.0.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.0.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.1.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.1.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.1.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.10.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.10.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.10.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.100.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.100.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.100.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.101.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.101.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.101.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.102.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.102.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.102.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.103.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.103.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.103.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.104.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.104.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.104.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.105.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.105.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.105.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.106.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.106.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.106.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.107.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.107.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.107.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.108.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.108.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.108.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.109.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.109.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.109.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.11.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.11.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.11.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.110.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.110.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.110.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.111.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.111.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.111.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.112.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.112.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.112.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.113.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.113.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.113.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.114.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.114.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.114.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.115.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.115.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.115.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.116.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.116.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.116.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.117.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.117.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.117.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.118.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.118.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.118.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.119.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.119.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.119.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.12.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.12.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.12.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.120.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.120.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.120.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.121.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.121.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.121.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.122.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.122.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.122.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.123.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.123.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.123.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.124.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.124.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.124.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.125.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.125.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.125.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.126.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.126.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.126.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.127.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.127.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.127.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.128.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.128.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.128.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.129.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.129.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.129.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.13.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.13.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.13.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.130.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.130.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.130.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.131.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.131.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.131.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.132.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.132.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.132.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.133.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.133.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.133.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.134.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.134.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.134.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.135.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.135.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.135.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.136.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.136.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.136.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.137.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.137.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.137.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.138.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.138.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.138.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.139.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.139.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.139.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.14.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.14.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.14.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.140.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.140.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.140.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.141.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.141.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.141.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.142.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.142.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.142.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.143.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.143.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.143.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.144.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.144.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.144.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.145.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.145.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.145.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.146.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.146.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.146.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.147.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.147.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.147.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.148.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.148.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.148.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.149.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.149.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.149.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.15.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.15.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.15.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.150.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.150.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.150.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.151.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.151.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.151.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.152.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.152.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.152.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.153.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.153.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.153.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.154.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.154.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.154.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.155.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.experts.155.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.155.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.experts.156.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.experts.156.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.experts.156.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.experts.157.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.experts.157.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.experts.157.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.experts.158.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.experts.158.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.experts.158.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.experts.159.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.experts.159.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.experts.159.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.experts.16.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.16.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.16.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.17.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.17.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.17.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.18.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.18.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.18.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.19.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.19.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.19.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.2.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.2.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.2.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.20.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.20.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.20.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.21.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.21.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.21.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.22.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.22.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.22.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.23.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.23.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.23.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.24.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.24.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.24.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.25.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.25.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.25.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.26.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.26.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.26.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.27.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.27.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.27.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.28.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.28.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.28.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.29.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.29.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.29.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.3.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.3.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.3.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.30.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.30.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.30.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.31.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.31.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.31.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.32.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.32.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.32.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.33.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.33.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.33.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.34.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.34.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.34.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.35.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.35.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.35.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.36.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.36.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.36.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.37.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.37.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.37.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.38.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.38.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.38.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.39.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.39.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.39.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.4.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.4.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.4.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.40.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.40.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.40.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.41.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.41.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.41.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.42.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.42.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.42.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.43.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.43.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.43.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.44.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.44.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.44.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.45.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.45.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.45.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.46.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.46.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.46.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.47.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.47.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.47.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.48.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.48.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.48.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.49.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.49.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.49.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.5.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.5.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.5.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.50.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.50.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.50.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.51.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.51.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.51.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.52.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.52.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.52.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.53.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.53.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.53.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.54.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.54.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.54.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.55.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.55.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.55.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.56.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.56.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.56.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.57.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.57.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.57.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.58.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.58.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.58.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.59.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.59.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.59.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.6.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.6.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.6.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.60.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.60.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.60.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.61.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.61.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.61.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.62.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.62.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.62.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.63.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.63.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.63.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.64.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.64.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.64.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.65.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.65.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.65.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.66.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.66.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.66.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.67.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.67.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.67.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.68.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.68.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.68.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.69.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.69.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.69.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.7.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.7.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.7.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.70.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.70.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.70.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.71.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.71.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.71.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.72.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.72.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.72.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.73.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.73.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.73.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.74.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.74.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.74.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.75.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.75.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.75.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.76.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.76.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.76.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.77.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.77.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.77.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.78.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.78.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.78.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.79.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.79.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.79.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.8.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.8.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.8.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.80.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.80.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.80.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.81.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.81.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.81.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.82.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.82.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.82.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.83.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.83.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.83.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.84.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.84.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.84.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.85.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.85.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.85.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.86.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.86.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.86.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.87.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.87.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.87.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.88.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.88.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.88.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.89.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.89.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.89.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.9.down_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.9.gate_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.9.up_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.mlp.experts.90.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.90.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.90.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.91.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.91.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.91.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.92.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.92.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.92.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.93.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.93.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.93.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.94.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.94.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.94.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.95.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.95.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.95.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.96.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.96.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.96.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.97.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.97.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.97.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.98.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.98.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.98.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.99.down_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.99.gate_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.experts.99.up_proj.weight": "model-00089-of-00142.safetensors", + "model.layers.58.mlp.gate.e_score_correction_bias": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.gate.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.shared_experts.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.shared_experts.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.mlp.shared_experts.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.58.post_attention_layernorm.weight": "model-00090-of-00142.safetensors", + "model.layers.58.self_attn.k_norm.weight": "model-00088-of-00142.safetensors", + "model.layers.58.self_attn.k_proj.bias": "model-00088-of-00142.safetensors", + "model.layers.58.self_attn.k_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.self_attn.o_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.self_attn.q_norm.weight": "model-00088-of-00142.safetensors", + "model.layers.58.self_attn.q_proj.bias": "model-00088-of-00142.safetensors", + "model.layers.58.self_attn.q_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.58.self_attn.v_proj.bias": "model-00088-of-00142.safetensors", + "model.layers.58.self_attn.v_proj.weight": "model-00088-of-00142.safetensors", + "model.layers.59.input_layernorm.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.0.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.0.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.0.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.1.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.1.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.1.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.10.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.10.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.10.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.100.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.100.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.100.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.101.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.101.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.101.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.102.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.102.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.102.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.103.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.103.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.103.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.104.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.104.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.104.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.105.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.105.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.105.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.106.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.106.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.106.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.107.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.107.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.107.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.108.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.108.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.108.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.109.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.109.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.109.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.11.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.11.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.11.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.110.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.110.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.110.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.111.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.111.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.111.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.112.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.112.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.112.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.113.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.113.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.113.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.114.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.114.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.114.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.115.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.115.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.115.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.116.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.116.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.116.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.117.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.117.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.117.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.118.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.118.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.118.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.119.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.119.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.119.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.12.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.12.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.12.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.120.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.120.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.120.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.121.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.121.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.121.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.122.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.122.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.122.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.123.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.123.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.123.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.124.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.124.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.124.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.125.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.125.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.125.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.126.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.126.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.126.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.127.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.127.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.127.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.128.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.128.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.128.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.129.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.129.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.129.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.13.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.13.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.13.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.130.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.130.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.130.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.131.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.131.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.131.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.132.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.132.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.132.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.133.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.133.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.133.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.134.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.134.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.134.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.135.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.135.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.135.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.136.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.136.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.136.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.137.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.137.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.137.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.138.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.138.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.138.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.139.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.139.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.139.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.14.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.14.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.14.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.140.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.140.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.140.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.141.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.141.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.141.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.142.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.142.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.142.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.143.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.143.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.143.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.144.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.144.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.144.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.145.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.145.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.145.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.146.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.146.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.146.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.147.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.147.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.147.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.148.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.148.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.148.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.149.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.149.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.149.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.15.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.15.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.15.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.150.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.150.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.150.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.151.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.151.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.151.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.152.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.152.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.152.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.153.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.153.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.153.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.154.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.154.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.154.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.155.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.155.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.155.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.156.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.156.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.156.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.157.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.157.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.157.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.158.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.158.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.158.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.159.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.159.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.159.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.16.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.16.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.16.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.17.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.17.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.17.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.18.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.18.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.18.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.19.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.19.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.19.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.2.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.2.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.2.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.20.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.20.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.20.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.21.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.21.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.21.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.22.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.22.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.22.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.23.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.23.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.23.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.24.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.24.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.24.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.25.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.25.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.25.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.26.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.26.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.26.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.27.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.27.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.27.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.28.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.28.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.28.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.29.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.29.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.29.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.3.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.3.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.3.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.30.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.30.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.30.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.31.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.31.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.31.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.32.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.32.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.32.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.33.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.33.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.33.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.34.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.34.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.34.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.35.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.35.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.35.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.36.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.36.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.36.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.37.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.37.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.37.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.38.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.38.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.38.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.39.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.39.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.39.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.4.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.4.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.4.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.40.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.40.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.40.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.41.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.41.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.41.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.42.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.42.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.42.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.43.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.43.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.43.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.44.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.44.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.44.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.45.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.45.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.45.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.46.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.46.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.46.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.47.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.47.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.47.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.48.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.48.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.48.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.49.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.49.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.49.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.5.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.5.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.5.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.50.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.50.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.50.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.51.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.51.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.51.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.52.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.52.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.52.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.53.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.53.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.53.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.54.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.54.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.54.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.55.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.55.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.55.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.56.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.56.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.56.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.57.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.57.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.57.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.58.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.58.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.58.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.59.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.59.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.59.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.6.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.6.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.6.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.60.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.60.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.60.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.61.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.61.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.61.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.62.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.62.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.62.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.63.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.63.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.63.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.64.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.64.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.64.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.65.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.65.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.65.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.66.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.66.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.66.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.67.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.67.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.67.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.68.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.68.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.68.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.69.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.69.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.69.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.7.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.7.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.7.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.70.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.70.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.70.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.71.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.71.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.71.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.72.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.72.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.72.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.73.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.73.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.73.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.74.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.74.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.74.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.75.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.75.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.75.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.76.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.76.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.76.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.77.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.77.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.77.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.78.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.78.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.78.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.79.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.79.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.79.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.8.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.8.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.8.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.80.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.80.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.80.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.81.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.81.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.81.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.82.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.82.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.82.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.83.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.83.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.83.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.84.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.84.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.84.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.85.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.85.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.85.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.86.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.86.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.86.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.87.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.87.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.87.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.88.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.88.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.88.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.89.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.89.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.89.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.9.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.9.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.9.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.90.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.90.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.90.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.91.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.91.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.91.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.92.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.92.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.92.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.93.down_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.93.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.93.up_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.94.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.94.gate_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.mlp.experts.94.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.95.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.95.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.95.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.96.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.96.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.96.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.97.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.97.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.97.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.98.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.98.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.98.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.99.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.99.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.experts.99.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.gate.e_score_correction_bias": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.gate.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.shared_experts.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.shared_experts.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.mlp.shared_experts.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.59.post_attention_layernorm.weight": "model-00091-of-00142.safetensors", + "model.layers.59.self_attn.k_norm.weight": "model-00090-of-00142.safetensors", + "model.layers.59.self_attn.k_proj.bias": "model-00090-of-00142.safetensors", + "model.layers.59.self_attn.k_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.self_attn.o_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.self_attn.q_norm.weight": "model-00090-of-00142.safetensors", + "model.layers.59.self_attn.q_proj.bias": "model-00090-of-00142.safetensors", + "model.layers.59.self_attn.q_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.59.self_attn.v_proj.bias": "model-00090-of-00142.safetensors", + "model.layers.59.self_attn.v_proj.weight": "model-00090-of-00142.safetensors", + "model.layers.6.input_layernorm.weight": "model-00008-of-00142.safetensors", + "model.layers.6.mlp.experts.0.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.0.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.0.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.1.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.1.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.1.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.10.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.10.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.10.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.100.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.100.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.100.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.101.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.101.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.101.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.102.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.102.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.102.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.103.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.103.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.103.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.104.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.104.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.104.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.105.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.105.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.105.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.106.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.106.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.106.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.107.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.107.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.107.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.108.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.108.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.108.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.109.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.109.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.109.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.11.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.11.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.11.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.110.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.110.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.110.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.111.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.111.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.111.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.112.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.112.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.112.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.113.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.113.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.113.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.114.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.114.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.114.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.115.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.115.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.115.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.116.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.116.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.116.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.117.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.117.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.117.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.118.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.118.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.118.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.119.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.119.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.119.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.12.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.12.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.12.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.120.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.120.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.120.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.121.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.121.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.121.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.122.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.122.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.122.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.123.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.123.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.123.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.124.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.124.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.124.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.125.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.125.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.125.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.126.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.126.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.126.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.127.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.127.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.127.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.128.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.128.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.128.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.129.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.129.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.129.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.13.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.13.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.13.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.130.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.130.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.130.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.131.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.131.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.131.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.132.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.132.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.132.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.133.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.133.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.133.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.134.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.134.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.134.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.135.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.135.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.135.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.136.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.136.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.136.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.137.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.137.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.137.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.138.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.138.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.138.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.139.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.139.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.139.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.14.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.14.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.14.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.140.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.140.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.140.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.141.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.141.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.141.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.142.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.142.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.142.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.143.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.143.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.143.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.144.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.144.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.144.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.145.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.145.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.145.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.146.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.146.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.146.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.147.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.147.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.147.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.148.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.148.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.148.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.149.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.149.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.149.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.15.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.15.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.15.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.150.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.150.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.150.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.151.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.151.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.151.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.152.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.152.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.152.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.153.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.153.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.153.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.154.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.154.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.154.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.155.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.155.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.155.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.156.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.156.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.156.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.157.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.157.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.157.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.158.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.158.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.158.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.159.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.6.mlp.experts.159.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.159.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.16.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.16.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.16.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.17.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.17.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.17.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.18.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.18.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.18.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.19.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.19.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.19.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.2.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.2.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.2.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.20.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.20.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.20.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.21.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.21.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.21.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.22.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.22.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.22.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.23.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.23.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.23.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.24.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.24.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.24.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.25.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.25.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.25.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.26.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.26.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.26.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.27.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.27.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.27.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.28.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.28.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.28.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.29.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.29.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.29.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.3.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.3.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.3.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.30.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.30.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.30.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.31.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.31.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.31.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.32.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.32.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.32.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.33.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.33.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.33.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.34.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.34.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.34.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.35.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.35.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.35.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.36.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.36.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.36.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.37.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.37.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.37.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.38.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.38.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.38.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.39.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.39.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.39.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.4.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.4.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.4.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.40.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.40.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.40.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.41.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.41.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.41.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.42.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.42.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.42.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.43.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.43.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.43.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.44.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.44.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.44.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.45.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.45.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.45.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.46.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.46.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.46.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.47.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.47.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.47.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.48.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.48.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.48.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.49.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.49.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.49.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.5.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.5.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.5.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.50.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.50.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.50.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.51.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.51.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.51.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.52.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.52.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.52.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.53.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.53.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.53.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.54.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.54.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.54.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.55.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.55.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.55.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.56.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.56.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.56.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.57.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.57.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.57.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.58.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.58.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.58.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.59.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.59.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.59.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.6.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.6.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.6.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.60.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.60.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.60.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.61.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.61.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.61.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.62.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.62.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.62.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.63.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.63.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.63.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.64.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.64.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.64.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.65.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.65.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.65.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.66.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.66.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.66.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.67.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.67.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.67.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.68.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.68.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.68.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.69.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.69.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.69.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.7.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.7.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.7.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.70.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.70.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.70.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.71.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.71.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.71.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.72.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.72.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.72.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.73.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.73.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.73.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.74.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.74.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.74.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.75.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.75.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.75.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.76.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.76.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.76.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.77.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.77.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.77.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.78.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.78.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.78.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.79.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.79.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.79.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.8.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.8.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.8.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.80.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.80.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.80.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.81.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.81.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.81.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.82.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.82.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.82.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.83.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.83.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.83.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.84.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.84.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.84.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.85.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.85.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.85.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.86.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.86.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.86.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.87.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.87.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.87.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.88.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.88.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.88.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.89.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.89.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.89.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.9.down_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.9.gate_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.9.up_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.mlp.experts.90.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.90.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.90.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.91.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.91.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.91.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.92.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.92.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.92.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.93.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.93.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.93.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.94.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.94.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.94.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.95.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.95.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.95.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.96.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.96.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.96.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.97.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.97.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.97.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.98.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.98.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.98.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.99.down_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.99.gate_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.experts.99.up_proj.weight": "model-00007-of-00142.safetensors", + "model.layers.6.mlp.gate.e_score_correction_bias": "model-00008-of-00142.safetensors", + "model.layers.6.mlp.gate.weight": "model-00008-of-00142.safetensors", + "model.layers.6.mlp.shared_experts.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.6.mlp.shared_experts.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.6.mlp.shared_experts.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00008-of-00142.safetensors", + "model.layers.6.self_attn.k_norm.weight": "model-00006-of-00142.safetensors", + "model.layers.6.self_attn.k_proj.bias": "model-00006-of-00142.safetensors", + "model.layers.6.self_attn.k_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.self_attn.q_norm.weight": "model-00006-of-00142.safetensors", + "model.layers.6.self_attn.q_proj.bias": "model-00006-of-00142.safetensors", + "model.layers.6.self_attn.q_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.6.self_attn.v_proj.bias": "model-00006-of-00142.safetensors", + "model.layers.6.self_attn.v_proj.weight": "model-00006-of-00142.safetensors", + "model.layers.60.input_layernorm.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.0.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.0.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.0.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.1.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.1.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.1.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.10.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.10.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.10.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.100.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.100.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.100.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.101.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.101.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.101.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.102.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.102.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.102.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.103.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.103.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.103.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.104.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.104.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.104.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.105.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.105.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.105.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.106.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.106.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.106.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.107.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.107.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.107.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.108.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.108.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.108.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.109.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.109.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.109.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.11.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.11.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.11.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.110.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.110.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.110.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.111.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.111.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.111.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.112.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.112.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.112.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.113.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.113.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.113.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.114.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.114.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.114.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.115.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.115.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.115.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.116.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.116.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.116.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.117.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.117.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.117.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.118.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.118.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.118.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.119.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.119.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.119.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.12.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.12.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.12.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.120.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.120.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.120.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.121.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.121.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.121.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.122.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.122.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.122.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.123.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.123.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.123.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.124.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.124.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.124.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.125.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.125.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.125.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.126.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.126.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.126.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.127.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.127.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.127.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.128.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.128.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.128.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.129.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.129.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.129.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.13.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.13.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.13.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.130.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.130.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.130.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.131.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.131.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.131.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.132.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.132.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.132.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.133.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.133.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.133.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.134.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.134.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.134.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.135.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.135.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.135.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.136.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.136.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.136.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.137.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.137.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.137.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.138.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.138.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.138.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.139.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.139.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.139.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.14.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.14.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.14.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.140.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.140.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.140.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.141.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.141.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.141.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.142.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.142.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.142.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.143.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.143.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.143.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.144.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.144.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.144.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.145.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.145.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.145.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.146.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.146.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.146.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.147.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.147.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.147.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.148.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.148.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.148.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.149.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.149.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.149.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.15.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.15.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.15.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.150.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.150.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.150.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.151.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.151.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.151.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.152.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.152.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.152.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.153.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.153.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.153.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.154.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.154.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.154.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.155.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.155.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.155.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.156.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.156.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.156.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.157.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.157.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.157.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.158.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.158.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.158.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.159.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.159.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.159.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.experts.16.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.16.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.16.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.17.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.17.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.17.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.18.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.18.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.18.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.19.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.19.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.19.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.2.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.2.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.2.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.20.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.20.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.20.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.21.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.21.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.21.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.22.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.22.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.22.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.23.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.23.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.23.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.24.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.24.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.24.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.25.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.25.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.25.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.26.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.26.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.26.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.27.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.27.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.27.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.28.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.28.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.28.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.29.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.29.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.29.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.3.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.3.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.3.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.30.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.30.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.30.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.31.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.31.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.31.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.32.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.32.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.32.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.33.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.33.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.33.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.34.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.34.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.34.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.35.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.35.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.35.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.36.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.36.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.36.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.37.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.37.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.37.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.38.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.38.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.38.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.39.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.39.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.39.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.4.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.4.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.4.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.40.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.40.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.40.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.41.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.41.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.41.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.42.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.42.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.42.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.43.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.43.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.43.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.44.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.44.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.44.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.45.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.45.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.45.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.46.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.46.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.46.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.47.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.47.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.47.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.48.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.48.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.48.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.49.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.49.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.49.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.5.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.5.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.5.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.50.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.50.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.50.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.51.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.51.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.51.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.52.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.52.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.52.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.53.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.53.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.53.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.54.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.54.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.54.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.55.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.55.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.55.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.56.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.56.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.56.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.57.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.57.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.57.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.58.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.58.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.58.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.59.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.59.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.59.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.6.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.6.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.6.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.60.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.60.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.60.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.61.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.61.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.61.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.62.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.62.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.62.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.63.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.63.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.63.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.64.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.64.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.64.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.65.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.65.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.65.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.66.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.66.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.66.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.67.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.67.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.67.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.68.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.68.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.68.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.69.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.69.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.69.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.7.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.7.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.7.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.70.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.70.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.70.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.71.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.71.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.71.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.72.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.72.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.72.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.73.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.73.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.73.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.74.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.74.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.74.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.75.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.75.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.75.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.76.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.76.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.76.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.77.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.77.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.77.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.78.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.78.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.78.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.79.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.79.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.79.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.8.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.8.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.8.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.80.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.80.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.80.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.81.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.81.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.81.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.82.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.82.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.82.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.83.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.83.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.83.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.84.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.84.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.84.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.85.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.85.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.85.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.86.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.86.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.86.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.87.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.87.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.87.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.88.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.88.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.88.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.89.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.89.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.89.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.9.down_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.9.gate_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.9.up_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.mlp.experts.90.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.90.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.90.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.91.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.91.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.91.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.92.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.92.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.92.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.93.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.93.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.93.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.94.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.94.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.94.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.95.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.95.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.95.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.96.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.96.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.96.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.97.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.97.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.97.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.98.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.98.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.98.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.99.down_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.99.gate_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.experts.99.up_proj.weight": "model-00092-of-00142.safetensors", + "model.layers.60.mlp.gate.e_score_correction_bias": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.gate.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.shared_experts.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.shared_experts.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.mlp.shared_experts.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.60.post_attention_layernorm.weight": "model-00093-of-00142.safetensors", + "model.layers.60.self_attn.k_norm.weight": "model-00091-of-00142.safetensors", + "model.layers.60.self_attn.k_proj.bias": "model-00091-of-00142.safetensors", + "model.layers.60.self_attn.k_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.self_attn.o_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.self_attn.q_norm.weight": "model-00091-of-00142.safetensors", + "model.layers.60.self_attn.q_proj.bias": "model-00091-of-00142.safetensors", + "model.layers.60.self_attn.q_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.60.self_attn.v_proj.bias": "model-00091-of-00142.safetensors", + "model.layers.60.self_attn.v_proj.weight": "model-00091-of-00142.safetensors", + "model.layers.61.input_layernorm.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.0.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.0.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.0.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.1.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.1.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.1.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.10.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.10.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.10.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.100.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.100.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.100.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.101.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.101.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.101.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.102.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.102.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.102.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.103.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.103.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.103.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.104.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.104.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.104.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.105.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.105.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.105.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.106.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.106.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.106.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.107.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.107.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.107.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.108.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.108.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.108.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.109.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.109.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.109.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.11.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.11.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.11.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.110.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.110.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.110.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.111.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.111.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.111.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.112.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.112.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.112.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.113.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.113.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.113.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.114.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.114.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.114.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.115.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.115.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.115.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.116.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.116.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.116.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.117.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.117.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.117.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.118.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.118.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.118.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.119.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.119.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.119.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.12.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.12.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.12.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.120.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.120.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.120.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.121.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.121.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.121.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.122.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.122.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.122.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.123.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.123.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.123.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.124.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.124.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.124.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.125.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.125.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.125.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.126.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.126.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.126.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.127.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.127.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.127.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.128.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.128.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.128.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.129.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.129.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.129.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.13.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.13.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.13.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.130.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.130.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.130.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.131.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.131.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.131.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.132.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.132.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.132.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.133.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.133.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.133.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.134.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.134.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.134.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.135.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.135.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.135.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.136.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.136.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.136.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.137.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.137.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.137.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.138.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.138.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.138.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.139.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.139.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.139.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.14.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.14.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.14.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.140.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.140.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.140.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.141.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.141.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.141.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.142.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.142.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.142.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.143.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.143.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.143.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.144.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.144.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.144.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.145.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.145.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.145.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.146.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.146.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.146.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.147.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.147.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.147.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.148.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.148.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.148.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.149.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.149.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.149.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.15.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.15.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.15.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.150.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.150.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.150.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.151.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.151.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.151.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.152.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.152.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.152.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.153.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.153.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.153.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.154.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.154.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.154.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.155.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.155.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.155.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.156.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.156.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.156.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.157.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.157.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.157.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.158.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.158.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.158.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.159.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.159.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.159.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.16.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.16.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.16.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.17.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.17.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.17.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.18.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.18.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.18.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.19.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.19.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.19.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.2.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.2.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.2.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.20.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.20.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.20.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.21.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.21.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.21.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.22.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.22.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.22.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.23.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.23.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.23.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.24.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.24.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.24.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.25.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.25.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.25.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.26.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.26.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.26.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.27.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.27.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.27.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.28.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.28.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.28.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.29.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.29.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.29.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.3.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.3.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.3.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.30.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.30.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.30.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.31.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.31.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.31.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.32.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.32.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.32.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.33.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.33.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.33.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.34.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.34.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.34.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.35.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.35.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.35.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.36.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.36.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.36.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.37.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.37.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.37.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.38.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.38.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.38.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.39.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.39.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.39.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.4.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.4.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.4.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.40.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.40.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.40.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.41.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.41.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.41.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.42.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.42.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.42.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.43.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.43.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.43.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.44.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.44.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.44.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.45.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.45.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.45.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.46.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.46.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.46.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.47.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.47.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.47.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.48.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.48.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.48.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.49.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.49.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.49.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.5.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.5.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.5.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.50.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.50.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.50.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.51.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.51.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.51.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.52.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.52.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.52.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.53.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.53.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.53.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.54.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.54.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.54.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.55.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.55.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.55.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.56.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.56.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.56.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.57.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.57.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.57.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.58.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.58.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.58.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.59.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.59.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.59.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.6.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.6.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.6.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.60.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.60.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.60.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.61.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.61.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.61.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.62.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.62.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.62.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.63.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.63.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.63.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.64.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.64.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.64.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.65.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.65.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.65.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.66.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.66.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.66.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.67.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.67.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.67.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.68.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.68.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.68.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.69.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.69.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.69.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.7.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.7.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.7.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.70.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.70.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.70.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.71.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.71.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.71.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.72.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.72.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.72.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.73.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.73.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.73.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.74.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.74.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.74.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.75.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.75.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.75.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.76.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.76.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.76.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.77.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.77.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.77.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.78.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.78.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.78.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.79.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.79.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.79.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.8.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.8.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.8.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.80.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.80.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.80.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.81.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.81.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.81.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.82.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.82.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.82.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.83.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.83.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.83.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.84.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.84.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.84.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.85.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.85.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.85.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.86.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.86.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.86.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.87.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.87.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.87.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.88.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.88.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.88.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.89.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.89.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.89.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.9.down_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.9.gate_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.9.up_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.mlp.experts.90.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.90.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.90.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.91.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.91.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.91.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.92.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.92.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.92.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.93.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.93.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.93.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.94.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.94.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.94.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.95.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.95.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.95.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.96.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.96.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.96.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.97.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.97.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.97.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.98.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.98.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.98.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.99.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.99.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.experts.99.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.gate.e_score_correction_bias": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.gate.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.shared_experts.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.shared_experts.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.mlp.shared_experts.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.61.post_attention_layernorm.weight": "model-00094-of-00142.safetensors", + "model.layers.61.self_attn.k_norm.weight": "model-00093-of-00142.safetensors", + "model.layers.61.self_attn.k_proj.bias": "model-00093-of-00142.safetensors", + "model.layers.61.self_attn.k_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.self_attn.o_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.self_attn.q_norm.weight": "model-00093-of-00142.safetensors", + "model.layers.61.self_attn.q_proj.bias": "model-00093-of-00142.safetensors", + "model.layers.61.self_attn.q_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.61.self_attn.v_proj.bias": "model-00093-of-00142.safetensors", + "model.layers.61.self_attn.v_proj.weight": "model-00093-of-00142.safetensors", + "model.layers.62.input_layernorm.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.0.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.0.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.0.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.1.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.1.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.1.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.10.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.10.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.10.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.100.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.100.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.100.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.101.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.101.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.101.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.102.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.102.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.102.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.103.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.103.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.103.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.104.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.104.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.104.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.105.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.105.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.105.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.106.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.106.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.106.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.107.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.107.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.107.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.108.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.108.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.108.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.109.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.109.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.109.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.11.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.11.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.11.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.110.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.110.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.110.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.111.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.111.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.111.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.112.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.112.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.112.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.113.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.113.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.113.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.114.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.114.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.114.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.115.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.115.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.115.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.116.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.116.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.116.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.117.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.117.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.117.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.118.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.118.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.118.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.119.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.119.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.119.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.12.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.12.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.12.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.120.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.120.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.120.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.121.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.121.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.121.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.122.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.122.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.122.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.123.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.123.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.123.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.124.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.124.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.124.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.125.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.125.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.125.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.126.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.126.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.126.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.127.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.127.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.127.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.128.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.128.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.128.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.129.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.129.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.129.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.13.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.13.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.13.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.130.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.130.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.130.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.131.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.131.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.131.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.132.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.132.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.132.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.133.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.133.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.133.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.134.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.134.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.134.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.135.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.135.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.135.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.136.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.136.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.136.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.137.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.137.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.137.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.138.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.138.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.138.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.139.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.139.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.139.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.14.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.14.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.14.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.140.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.140.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.140.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.141.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.141.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.141.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.142.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.142.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.142.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.143.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.143.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.143.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.144.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.144.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.144.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.145.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.145.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.145.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.146.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.146.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.146.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.147.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.147.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.147.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.148.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.148.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.148.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.149.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.149.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.149.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.15.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.15.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.15.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.150.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.150.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.150.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.151.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.151.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.151.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.152.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.152.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.152.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.153.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.153.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.153.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.154.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.154.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.154.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.155.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.155.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.155.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.156.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.156.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.156.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.157.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.157.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.157.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.158.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.158.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.158.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.159.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.159.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.159.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.experts.16.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.16.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.16.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.17.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.17.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.17.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.18.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.18.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.18.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.19.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.19.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.19.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.2.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.2.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.2.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.20.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.20.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.20.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.21.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.21.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.21.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.22.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.22.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.22.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.23.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.23.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.23.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.24.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.24.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.24.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.25.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.25.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.25.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.26.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.26.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.26.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.27.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.27.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.27.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.28.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.28.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.28.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.29.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.29.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.29.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.3.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.3.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.3.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.30.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.30.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.30.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.31.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.31.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.31.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.32.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.32.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.32.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.33.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.33.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.33.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.34.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.34.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.34.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.35.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.35.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.35.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.36.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.36.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.36.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.37.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.37.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.37.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.38.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.38.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.38.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.39.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.39.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.39.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.4.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.4.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.4.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.40.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.40.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.40.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.41.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.41.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.41.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.42.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.42.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.42.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.43.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.43.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.43.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.44.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.44.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.44.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.45.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.45.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.45.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.46.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.46.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.46.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.47.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.47.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.47.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.48.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.48.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.48.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.49.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.49.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.49.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.5.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.5.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.5.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.50.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.50.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.50.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.51.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.51.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.51.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.52.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.52.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.52.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.53.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.53.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.53.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.54.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.54.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.54.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.55.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.55.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.55.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.56.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.56.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.56.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.57.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.57.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.57.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.58.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.58.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.58.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.59.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.59.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.59.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.6.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.6.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.6.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.60.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.60.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.60.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.61.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.61.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.61.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.62.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.62.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.62.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.63.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.63.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.63.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.64.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.64.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.64.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.65.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.65.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.65.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.66.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.66.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.66.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.67.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.67.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.67.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.68.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.68.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.68.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.69.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.69.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.69.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.7.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.7.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.7.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.70.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.70.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.70.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.71.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.71.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.71.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.72.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.72.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.72.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.73.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.73.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.73.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.74.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.74.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.74.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.75.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.75.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.75.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.76.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.76.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.76.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.77.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.77.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.77.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.78.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.78.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.78.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.79.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.79.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.79.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.8.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.8.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.8.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.80.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.80.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.80.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.81.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.81.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.81.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.82.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.82.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.82.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.83.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.83.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.83.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.84.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.84.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.84.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.85.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.85.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.85.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.86.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.86.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.86.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.87.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.87.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.87.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.88.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.88.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.88.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.89.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.89.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.89.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.9.down_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.9.gate_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.9.up_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.mlp.experts.90.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.90.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.90.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.91.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.91.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.91.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.92.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.92.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.92.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.93.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.93.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.93.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.94.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.94.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.94.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.95.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.95.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.95.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.96.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.96.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.96.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.97.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.97.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.97.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.98.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.98.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.98.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.99.down_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.99.gate_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.experts.99.up_proj.weight": "model-00095-of-00142.safetensors", + "model.layers.62.mlp.gate.e_score_correction_bias": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.gate.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.shared_experts.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.shared_experts.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.mlp.shared_experts.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.62.post_attention_layernorm.weight": "model-00096-of-00142.safetensors", + "model.layers.62.self_attn.k_norm.weight": "model-00094-of-00142.safetensors", + "model.layers.62.self_attn.k_proj.bias": "model-00094-of-00142.safetensors", + "model.layers.62.self_attn.k_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.self_attn.o_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.self_attn.q_norm.weight": "model-00094-of-00142.safetensors", + "model.layers.62.self_attn.q_proj.bias": "model-00094-of-00142.safetensors", + "model.layers.62.self_attn.q_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.62.self_attn.v_proj.bias": "model-00094-of-00142.safetensors", + "model.layers.62.self_attn.v_proj.weight": "model-00094-of-00142.safetensors", + "model.layers.63.input_layernorm.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.0.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.0.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.0.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.1.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.1.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.1.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.10.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.10.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.10.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.100.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.100.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.100.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.101.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.101.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.101.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.102.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.102.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.102.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.103.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.103.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.103.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.104.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.104.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.104.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.105.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.105.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.105.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.106.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.106.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.106.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.107.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.107.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.107.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.108.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.108.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.108.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.109.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.109.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.109.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.11.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.11.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.11.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.110.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.110.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.110.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.111.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.111.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.111.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.112.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.112.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.112.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.113.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.113.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.113.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.114.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.114.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.114.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.115.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.115.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.115.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.116.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.116.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.116.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.117.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.117.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.117.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.118.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.118.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.118.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.119.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.119.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.119.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.12.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.12.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.12.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.120.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.120.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.120.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.121.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.121.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.121.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.122.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.122.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.122.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.123.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.123.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.123.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.124.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.124.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.124.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.125.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.125.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.125.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.126.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.126.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.126.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.127.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.127.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.127.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.128.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.128.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.128.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.129.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.129.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.129.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.13.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.13.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.13.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.130.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.130.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.130.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.131.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.131.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.131.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.132.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.132.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.132.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.133.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.133.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.133.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.134.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.134.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.134.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.135.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.135.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.135.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.136.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.136.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.136.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.137.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.137.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.137.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.138.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.138.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.138.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.139.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.139.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.139.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.14.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.14.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.14.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.140.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.140.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.140.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.141.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.141.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.141.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.142.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.142.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.142.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.143.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.143.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.143.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.144.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.144.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.144.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.145.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.145.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.145.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.146.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.146.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.146.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.147.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.147.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.147.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.148.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.148.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.148.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.149.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.149.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.149.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.15.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.15.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.15.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.150.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.150.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.150.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.151.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.151.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.151.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.152.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.152.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.152.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.153.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.153.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.153.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.154.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.154.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.154.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.155.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.155.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.155.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.156.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.156.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.156.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.157.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.157.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.157.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.158.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.158.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.158.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.159.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.159.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.159.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.16.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.16.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.16.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.17.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.17.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.17.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.18.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.18.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.18.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.19.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.19.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.19.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.2.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.2.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.2.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.20.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.20.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.20.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.21.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.21.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.21.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.22.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.22.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.22.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.23.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.23.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.23.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.24.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.24.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.24.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.25.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.25.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.25.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.26.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.26.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.26.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.27.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.27.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.27.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.28.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.28.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.28.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.29.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.29.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.29.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.3.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.3.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.3.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.30.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.30.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.30.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.31.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.31.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.31.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.32.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.32.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.32.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.33.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.33.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.33.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.34.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.34.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.34.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.35.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.35.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.35.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.36.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.36.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.36.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.37.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.37.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.37.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.38.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.38.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.38.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.39.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.39.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.39.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.4.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.4.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.4.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.40.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.40.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.40.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.41.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.41.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.41.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.42.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.42.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.42.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.43.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.43.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.43.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.44.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.44.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.44.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.45.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.45.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.45.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.46.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.46.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.46.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.47.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.47.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.47.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.48.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.48.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.48.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.49.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.49.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.49.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.5.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.5.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.5.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.50.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.50.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.50.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.51.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.51.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.51.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.52.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.52.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.52.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.53.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.53.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.53.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.54.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.54.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.54.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.55.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.55.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.55.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.56.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.56.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.56.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.57.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.57.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.57.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.58.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.58.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.58.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.59.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.59.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.59.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.6.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.6.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.6.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.60.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.60.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.60.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.61.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.61.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.61.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.62.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.62.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.62.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.63.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.63.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.63.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.64.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.64.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.64.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.65.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.65.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.65.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.66.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.66.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.66.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.67.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.67.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.67.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.68.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.68.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.68.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.69.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.69.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.69.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.7.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.7.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.7.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.70.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.70.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.70.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.71.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.71.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.71.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.72.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.72.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.72.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.73.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.73.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.73.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.74.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.74.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.74.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.75.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.75.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.75.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.76.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.76.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.76.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.77.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.77.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.77.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.78.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.78.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.78.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.79.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.79.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.79.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.8.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.8.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.8.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.80.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.80.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.80.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.81.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.81.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.81.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.82.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.82.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.82.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.83.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.83.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.83.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.84.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.84.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.84.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.85.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.85.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.85.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.86.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.86.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.86.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.87.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.87.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.87.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.88.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.88.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.88.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.89.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.89.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.89.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.9.down_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.9.gate_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.9.up_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.mlp.experts.90.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.90.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.90.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.91.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.91.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.91.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.92.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.92.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.92.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.93.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.93.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.93.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.94.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.94.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.94.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.95.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.95.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.95.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.96.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.96.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.96.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.97.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.97.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.97.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.98.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.98.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.98.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.99.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.99.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.experts.99.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.gate.e_score_correction_bias": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.gate.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.shared_experts.down_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.shared_experts.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.mlp.shared_experts.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.63.post_attention_layernorm.weight": "model-00097-of-00142.safetensors", + "model.layers.63.self_attn.k_norm.weight": "model-00096-of-00142.safetensors", + "model.layers.63.self_attn.k_proj.bias": "model-00096-of-00142.safetensors", + "model.layers.63.self_attn.k_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.self_attn.o_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.self_attn.q_norm.weight": "model-00096-of-00142.safetensors", + "model.layers.63.self_attn.q_proj.bias": "model-00096-of-00142.safetensors", + "model.layers.63.self_attn.q_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.63.self_attn.v_proj.bias": "model-00096-of-00142.safetensors", + "model.layers.63.self_attn.v_proj.weight": "model-00096-of-00142.safetensors", + "model.layers.64.input_layernorm.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.0.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.0.gate_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.64.mlp.experts.0.up_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.64.mlp.experts.1.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.1.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.1.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.10.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.10.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.10.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.100.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.100.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.100.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.101.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.101.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.101.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.102.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.102.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.102.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.103.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.103.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.103.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.104.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.104.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.104.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.105.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.105.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.105.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.106.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.106.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.106.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.107.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.107.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.107.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.108.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.108.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.108.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.109.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.109.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.109.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.11.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.11.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.11.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.110.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.110.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.110.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.111.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.111.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.111.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.112.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.112.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.112.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.113.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.113.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.113.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.114.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.114.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.114.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.115.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.115.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.115.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.116.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.116.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.116.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.117.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.117.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.117.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.118.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.118.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.118.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.119.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.119.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.119.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.12.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.12.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.12.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.120.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.120.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.120.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.121.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.121.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.121.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.122.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.122.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.122.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.123.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.123.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.123.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.124.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.124.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.124.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.125.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.125.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.125.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.126.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.126.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.126.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.127.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.127.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.127.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.128.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.128.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.128.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.129.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.129.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.129.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.13.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.13.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.13.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.130.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.130.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.130.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.131.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.131.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.131.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.132.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.132.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.132.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.133.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.133.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.133.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.134.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.134.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.134.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.135.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.135.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.135.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.136.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.136.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.136.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.137.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.137.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.137.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.138.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.138.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.138.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.139.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.139.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.139.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.14.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.14.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.14.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.140.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.140.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.140.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.141.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.141.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.141.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.142.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.142.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.142.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.143.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.143.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.143.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.144.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.144.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.144.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.145.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.145.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.145.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.146.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.146.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.146.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.147.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.147.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.147.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.148.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.148.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.148.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.149.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.149.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.149.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.15.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.15.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.15.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.150.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.150.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.150.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.151.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.151.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.151.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.152.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.152.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.152.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.153.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.153.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.153.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.154.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.154.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.154.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.155.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.155.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.155.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.156.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.156.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.156.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.157.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.157.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.157.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.158.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.158.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.158.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.159.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.159.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.159.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.experts.16.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.16.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.16.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.17.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.17.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.17.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.18.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.18.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.18.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.19.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.19.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.19.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.2.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.2.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.2.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.20.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.20.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.20.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.21.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.21.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.21.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.22.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.22.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.22.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.23.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.23.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.23.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.24.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.24.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.24.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.25.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.25.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.25.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.26.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.26.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.26.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.27.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.27.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.27.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.28.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.28.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.28.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.29.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.29.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.29.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.3.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.3.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.3.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.30.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.30.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.30.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.31.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.31.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.31.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.32.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.32.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.32.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.33.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.33.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.33.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.34.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.34.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.34.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.35.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.35.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.35.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.36.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.36.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.36.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.37.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.37.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.37.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.38.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.38.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.38.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.39.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.39.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.39.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.4.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.4.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.4.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.40.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.40.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.40.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.41.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.41.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.41.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.42.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.42.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.42.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.43.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.43.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.43.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.44.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.44.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.44.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.45.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.45.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.45.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.46.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.46.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.46.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.47.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.47.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.47.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.48.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.48.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.48.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.49.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.49.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.49.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.5.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.5.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.5.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.50.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.50.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.50.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.51.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.51.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.51.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.52.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.52.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.52.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.53.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.53.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.53.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.54.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.54.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.54.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.55.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.55.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.55.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.56.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.56.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.56.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.57.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.57.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.57.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.58.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.58.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.58.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.59.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.59.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.59.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.6.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.6.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.6.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.60.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.60.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.60.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.61.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.61.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.61.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.62.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.62.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.62.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.63.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.63.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.63.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.64.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.64.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.64.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.65.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.65.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.65.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.66.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.66.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.66.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.67.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.67.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.67.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.68.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.68.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.68.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.69.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.69.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.69.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.7.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.7.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.7.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.70.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.70.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.70.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.71.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.71.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.71.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.72.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.72.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.72.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.73.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.73.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.73.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.74.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.74.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.74.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.75.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.75.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.75.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.76.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.76.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.76.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.77.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.77.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.77.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.78.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.78.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.78.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.79.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.79.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.79.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.8.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.8.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.8.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.80.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.80.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.80.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.81.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.81.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.81.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.82.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.82.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.82.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.83.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.83.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.83.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.84.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.84.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.84.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.85.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.85.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.85.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.86.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.86.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.86.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.87.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.87.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.87.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.88.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.88.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.88.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.89.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.89.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.89.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.9.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.9.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.9.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.90.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.90.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.90.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.91.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.91.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.91.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.92.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.92.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.92.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.93.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.93.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.93.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.94.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.94.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.94.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.95.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.95.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.95.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.96.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.96.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.96.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.97.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.97.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.97.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.98.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.98.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.98.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.99.down_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.99.gate_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.experts.99.up_proj.weight": "model-00098-of-00142.safetensors", + "model.layers.64.mlp.gate.e_score_correction_bias": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.gate.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.shared_experts.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.shared_experts.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.mlp.shared_experts.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.64.post_attention_layernorm.weight": "model-00099-of-00142.safetensors", + "model.layers.64.self_attn.k_norm.weight": "model-00097-of-00142.safetensors", + "model.layers.64.self_attn.k_proj.bias": "model-00097-of-00142.safetensors", + "model.layers.64.self_attn.k_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.64.self_attn.o_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.64.self_attn.q_norm.weight": "model-00097-of-00142.safetensors", + "model.layers.64.self_attn.q_proj.bias": "model-00097-of-00142.safetensors", + "model.layers.64.self_attn.q_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.64.self_attn.v_proj.bias": "model-00097-of-00142.safetensors", + "model.layers.64.self_attn.v_proj.weight": "model-00097-of-00142.safetensors", + "model.layers.65.input_layernorm.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.0.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.0.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.0.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.1.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.1.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.1.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.10.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.10.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.10.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.100.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.100.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.100.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.101.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.101.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.101.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.102.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.102.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.102.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.103.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.103.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.103.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.104.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.104.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.104.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.105.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.105.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.105.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.106.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.106.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.106.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.107.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.107.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.107.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.108.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.108.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.108.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.109.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.109.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.109.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.11.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.11.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.11.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.110.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.110.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.110.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.111.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.111.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.111.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.112.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.112.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.112.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.113.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.113.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.113.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.114.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.114.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.114.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.115.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.115.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.115.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.116.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.116.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.116.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.117.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.117.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.117.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.118.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.118.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.118.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.119.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.119.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.119.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.12.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.12.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.12.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.120.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.120.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.120.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.121.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.121.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.121.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.122.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.122.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.122.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.123.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.123.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.123.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.124.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.124.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.124.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.125.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.125.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.125.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.126.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.126.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.126.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.127.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.127.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.127.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.128.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.128.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.128.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.129.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.129.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.129.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.13.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.13.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.13.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.130.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.130.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.130.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.131.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.131.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.131.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.132.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.132.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.132.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.133.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.133.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.133.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.134.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.134.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.134.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.135.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.135.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.135.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.136.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.136.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.136.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.137.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.137.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.137.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.138.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.138.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.138.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.139.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.139.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.139.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.14.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.14.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.14.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.140.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.140.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.140.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.141.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.141.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.141.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.142.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.142.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.142.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.143.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.143.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.143.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.144.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.144.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.144.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.145.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.145.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.145.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.146.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.146.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.146.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.147.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.147.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.147.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.148.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.148.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.148.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.149.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.149.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.149.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.15.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.15.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.15.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.150.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.150.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.150.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.151.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.151.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.151.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.152.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.152.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.152.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.153.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.153.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.153.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.154.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.154.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.154.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.155.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.155.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.155.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.156.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.156.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.156.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.157.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.157.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.157.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.158.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.158.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.158.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.159.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.159.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.159.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.experts.16.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.16.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.16.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.17.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.17.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.17.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.18.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.18.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.18.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.19.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.19.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.19.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.2.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.2.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.2.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.20.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.20.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.20.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.21.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.21.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.21.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.22.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.22.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.22.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.23.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.23.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.23.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.24.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.24.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.24.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.25.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.25.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.25.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.26.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.26.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.26.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.27.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.27.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.27.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.28.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.28.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.28.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.29.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.29.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.29.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.3.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.3.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.3.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.30.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.30.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.30.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.31.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.31.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.31.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.32.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.32.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.32.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.33.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.33.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.33.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.34.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.34.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.34.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.35.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.35.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.35.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.36.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.36.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.36.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.37.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.37.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.37.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.38.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.38.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.38.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.39.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.39.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.39.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.4.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.4.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.4.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.40.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.40.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.40.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.41.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.41.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.41.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.42.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.42.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.42.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.43.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.43.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.43.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.44.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.44.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.44.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.45.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.45.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.45.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.46.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.46.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.46.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.47.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.47.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.47.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.48.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.48.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.48.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.49.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.49.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.49.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.5.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.5.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.5.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.50.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.50.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.50.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.51.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.51.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.51.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.52.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.52.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.52.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.53.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.53.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.53.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.54.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.54.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.54.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.55.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.55.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.55.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.56.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.56.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.56.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.57.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.57.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.57.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.58.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.58.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.58.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.59.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.59.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.59.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.6.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.6.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.6.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.60.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.60.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.60.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.61.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.61.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.61.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.62.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.62.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.62.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.63.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.63.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.63.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.64.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.64.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.64.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.65.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.65.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.65.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.66.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.66.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.66.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.67.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.67.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.67.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.68.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.68.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.68.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.69.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.69.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.69.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.7.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.7.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.7.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.70.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.70.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.70.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.71.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.71.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.71.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.72.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.72.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.72.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.73.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.73.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.73.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.74.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.74.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.74.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.75.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.75.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.75.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.76.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.76.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.76.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.77.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.77.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.77.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.78.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.78.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.78.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.79.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.79.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.79.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.8.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.8.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.8.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.80.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.80.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.80.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.81.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.81.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.81.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.82.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.82.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.82.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.83.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.83.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.83.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.84.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.84.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.84.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.85.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.85.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.85.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.86.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.86.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.86.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.87.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.87.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.87.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.88.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.88.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.88.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.89.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.89.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.89.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.9.down_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.9.gate_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.9.up_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.mlp.experts.90.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.90.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.90.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.91.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.91.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.91.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.92.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.92.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.92.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.93.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.93.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.93.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.94.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.94.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.94.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.95.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.95.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.95.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.96.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.96.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.96.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.97.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.97.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.97.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.98.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.98.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.98.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.99.down_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.99.gate_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.experts.99.up_proj.weight": "model-00100-of-00142.safetensors", + "model.layers.65.mlp.gate.e_score_correction_bias": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.gate.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.shared_experts.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.shared_experts.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.mlp.shared_experts.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.65.post_attention_layernorm.weight": "model-00101-of-00142.safetensors", + "model.layers.65.self_attn.k_norm.weight": "model-00099-of-00142.safetensors", + "model.layers.65.self_attn.k_proj.bias": "model-00099-of-00142.safetensors", + "model.layers.65.self_attn.k_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.self_attn.o_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.self_attn.q_norm.weight": "model-00099-of-00142.safetensors", + "model.layers.65.self_attn.q_proj.bias": "model-00099-of-00142.safetensors", + "model.layers.65.self_attn.q_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.65.self_attn.v_proj.bias": "model-00099-of-00142.safetensors", + "model.layers.65.self_attn.v_proj.weight": "model-00099-of-00142.safetensors", + "model.layers.66.input_layernorm.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.0.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.0.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.0.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.1.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.1.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.1.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.10.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.10.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.10.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.100.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.100.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.100.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.101.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.101.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.101.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.102.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.102.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.102.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.103.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.103.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.103.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.104.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.104.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.104.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.105.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.105.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.105.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.106.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.106.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.106.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.107.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.107.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.107.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.108.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.108.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.108.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.109.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.109.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.109.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.11.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.11.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.11.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.110.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.110.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.110.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.111.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.111.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.111.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.112.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.112.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.112.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.113.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.113.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.113.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.114.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.114.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.114.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.115.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.115.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.115.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.116.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.116.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.116.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.117.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.117.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.117.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.118.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.118.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.118.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.119.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.119.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.119.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.12.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.12.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.12.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.120.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.120.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.120.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.121.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.121.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.121.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.122.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.122.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.122.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.123.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.123.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.123.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.124.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.124.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.124.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.125.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.125.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.125.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.126.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.126.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.126.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.127.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.127.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.127.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.128.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.128.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.128.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.129.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.129.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.129.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.13.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.13.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.13.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.130.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.130.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.130.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.131.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.131.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.131.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.132.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.132.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.132.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.133.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.133.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.133.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.134.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.134.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.134.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.135.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.135.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.135.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.136.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.136.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.136.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.137.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.137.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.137.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.138.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.138.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.138.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.139.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.139.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.139.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.14.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.14.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.14.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.140.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.140.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.140.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.141.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.141.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.141.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.142.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.142.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.142.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.143.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.143.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.143.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.144.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.144.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.144.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.145.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.145.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.145.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.146.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.146.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.146.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.147.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.147.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.147.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.148.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.148.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.148.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.149.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.149.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.149.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.15.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.15.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.15.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.150.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.150.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.150.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.151.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.151.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.151.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.152.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.152.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.152.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.153.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.153.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.153.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.154.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.154.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.154.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.155.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.155.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.155.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.156.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.156.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.156.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.157.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.157.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.157.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.158.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.158.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.158.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.159.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.159.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.159.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.16.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.16.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.16.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.17.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.17.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.17.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.18.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.18.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.18.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.19.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.19.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.19.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.2.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.2.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.2.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.20.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.20.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.20.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.21.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.21.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.21.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.22.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.22.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.22.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.23.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.23.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.23.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.24.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.24.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.24.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.25.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.25.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.25.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.26.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.26.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.26.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.27.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.27.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.27.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.28.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.28.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.28.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.29.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.29.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.29.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.3.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.3.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.3.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.30.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.30.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.30.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.31.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.31.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.31.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.32.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.32.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.32.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.33.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.33.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.33.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.34.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.34.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.34.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.35.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.35.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.35.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.36.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.36.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.36.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.37.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.37.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.37.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.38.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.38.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.38.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.39.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.39.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.39.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.4.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.4.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.4.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.40.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.40.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.40.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.41.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.41.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.41.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.42.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.42.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.42.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.43.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.43.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.43.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.44.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.44.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.44.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.45.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.45.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.45.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.46.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.46.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.46.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.47.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.47.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.47.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.48.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.48.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.48.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.49.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.49.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.49.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.5.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.5.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.5.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.50.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.50.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.50.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.51.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.51.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.51.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.52.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.52.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.52.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.53.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.53.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.53.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.54.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.54.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.54.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.55.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.55.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.55.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.56.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.56.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.56.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.57.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.57.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.57.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.58.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.58.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.58.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.59.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.59.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.59.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.6.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.6.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.6.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.60.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.60.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.60.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.61.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.61.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.61.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.62.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.62.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.62.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.63.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.63.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.63.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.64.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.64.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.64.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.65.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.65.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.65.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.66.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.66.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.66.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.67.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.67.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.67.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.68.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.68.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.68.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.69.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.69.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.69.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.7.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.7.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.7.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.70.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.70.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.70.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.71.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.71.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.71.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.72.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.72.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.72.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.73.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.73.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.73.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.74.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.74.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.74.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.75.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.75.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.75.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.76.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.76.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.76.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.77.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.77.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.77.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.78.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.78.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.78.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.79.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.79.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.79.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.8.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.8.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.8.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.80.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.80.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.80.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.81.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.81.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.81.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.82.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.82.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.82.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.83.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.83.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.83.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.84.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.84.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.84.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.85.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.85.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.85.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.86.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.86.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.86.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.87.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.87.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.87.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.88.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.88.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.88.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.89.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.89.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.89.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.9.down_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.9.gate_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.9.up_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.mlp.experts.90.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.90.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.90.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.91.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.91.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.91.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.92.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.92.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.92.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.93.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.93.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.93.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.94.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.94.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.94.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.95.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.95.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.95.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.96.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.96.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.96.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.97.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.97.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.97.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.98.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.98.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.98.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.99.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.99.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.experts.99.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.gate.e_score_correction_bias": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.gate.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.shared_experts.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.shared_experts.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.mlp.shared_experts.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.66.post_attention_layernorm.weight": "model-00102-of-00142.safetensors", + "model.layers.66.self_attn.k_norm.weight": "model-00101-of-00142.safetensors", + "model.layers.66.self_attn.k_proj.bias": "model-00101-of-00142.safetensors", + "model.layers.66.self_attn.k_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.self_attn.o_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.self_attn.q_norm.weight": "model-00101-of-00142.safetensors", + "model.layers.66.self_attn.q_proj.bias": "model-00101-of-00142.safetensors", + "model.layers.66.self_attn.q_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.66.self_attn.v_proj.bias": "model-00101-of-00142.safetensors", + "model.layers.66.self_attn.v_proj.weight": "model-00101-of-00142.safetensors", + "model.layers.67.input_layernorm.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.0.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.0.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.0.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.1.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.1.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.1.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.10.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.10.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.10.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.100.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.100.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.100.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.101.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.101.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.101.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.102.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.102.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.102.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.103.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.103.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.103.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.104.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.104.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.104.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.105.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.105.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.105.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.106.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.106.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.106.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.107.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.107.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.107.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.108.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.108.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.108.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.109.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.109.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.109.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.11.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.11.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.11.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.110.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.110.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.110.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.111.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.111.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.111.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.112.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.112.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.112.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.113.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.113.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.113.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.114.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.114.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.114.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.115.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.115.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.115.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.116.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.116.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.116.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.117.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.117.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.117.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.118.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.118.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.118.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.119.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.119.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.119.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.12.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.12.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.12.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.120.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.120.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.120.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.121.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.121.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.121.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.122.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.122.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.122.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.123.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.123.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.123.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.124.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.124.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.124.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.125.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.125.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.125.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.126.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.126.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.126.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.127.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.127.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.127.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.128.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.128.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.128.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.129.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.129.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.129.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.13.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.13.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.13.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.130.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.130.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.130.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.131.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.131.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.131.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.132.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.132.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.132.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.133.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.133.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.133.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.134.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.134.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.134.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.135.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.135.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.135.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.136.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.136.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.136.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.137.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.137.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.137.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.138.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.138.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.138.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.139.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.139.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.139.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.14.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.14.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.14.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.140.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.140.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.140.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.141.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.141.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.141.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.142.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.142.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.142.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.143.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.143.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.143.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.144.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.144.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.144.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.145.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.145.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.145.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.146.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.146.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.146.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.147.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.147.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.147.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.148.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.148.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.148.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.149.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.149.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.149.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.15.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.15.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.15.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.150.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.150.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.150.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.151.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.151.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.151.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.152.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.152.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.152.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.153.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.153.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.153.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.154.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.154.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.154.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.155.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.155.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.155.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.156.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.156.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.156.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.157.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.157.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.157.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.158.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.158.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.158.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.159.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.159.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.159.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.experts.16.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.16.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.16.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.17.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.17.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.17.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.18.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.18.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.18.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.19.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.19.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.19.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.2.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.2.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.2.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.20.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.20.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.20.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.21.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.21.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.21.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.22.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.22.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.22.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.23.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.23.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.23.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.24.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.24.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.24.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.25.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.25.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.25.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.26.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.26.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.26.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.27.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.27.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.27.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.28.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.28.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.28.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.29.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.29.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.29.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.3.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.3.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.3.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.30.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.30.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.30.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.31.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.31.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.31.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.32.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.32.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.32.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.33.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.33.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.33.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.34.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.34.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.34.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.35.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.35.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.35.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.36.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.36.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.36.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.37.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.37.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.37.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.38.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.38.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.38.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.39.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.39.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.39.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.4.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.4.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.4.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.40.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.40.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.40.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.41.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.41.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.41.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.42.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.42.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.42.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.43.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.43.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.43.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.44.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.44.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.44.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.45.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.45.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.45.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.46.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.46.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.46.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.47.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.47.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.47.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.48.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.48.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.48.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.49.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.49.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.49.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.5.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.5.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.5.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.50.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.50.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.50.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.51.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.51.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.51.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.52.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.52.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.52.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.53.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.53.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.53.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.54.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.54.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.54.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.55.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.55.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.55.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.56.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.56.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.56.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.57.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.57.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.57.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.58.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.58.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.58.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.59.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.59.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.59.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.6.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.6.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.6.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.60.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.60.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.60.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.61.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.61.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.61.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.62.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.62.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.62.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.63.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.63.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.63.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.64.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.64.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.64.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.65.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.65.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.65.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.66.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.66.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.66.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.67.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.67.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.67.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.68.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.68.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.68.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.69.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.69.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.69.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.7.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.7.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.7.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.70.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.70.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.70.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.71.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.71.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.71.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.72.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.72.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.72.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.73.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.73.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.73.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.74.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.74.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.74.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.75.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.75.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.75.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.76.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.76.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.76.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.77.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.77.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.77.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.78.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.78.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.78.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.79.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.79.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.79.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.8.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.8.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.8.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.80.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.80.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.80.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.81.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.81.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.81.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.82.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.82.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.82.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.83.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.83.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.83.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.84.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.84.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.84.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.85.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.85.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.85.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.86.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.86.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.86.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.87.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.87.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.87.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.88.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.88.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.88.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.89.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.89.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.89.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.9.down_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.9.gate_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.9.up_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.mlp.experts.90.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.90.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.90.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.91.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.91.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.91.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.92.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.92.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.92.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.93.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.93.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.93.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.94.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.94.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.94.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.95.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.95.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.95.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.96.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.96.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.96.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.97.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.97.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.97.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.98.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.98.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.98.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.99.down_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.99.gate_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.experts.99.up_proj.weight": "model-00103-of-00142.safetensors", + "model.layers.67.mlp.gate.e_score_correction_bias": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.gate.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.shared_experts.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.shared_experts.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.mlp.shared_experts.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.67.post_attention_layernorm.weight": "model-00104-of-00142.safetensors", + "model.layers.67.self_attn.k_norm.weight": "model-00102-of-00142.safetensors", + "model.layers.67.self_attn.k_proj.bias": "model-00102-of-00142.safetensors", + "model.layers.67.self_attn.k_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.self_attn.o_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.self_attn.q_norm.weight": "model-00102-of-00142.safetensors", + "model.layers.67.self_attn.q_proj.bias": "model-00102-of-00142.safetensors", + "model.layers.67.self_attn.q_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.67.self_attn.v_proj.bias": "model-00102-of-00142.safetensors", + "model.layers.67.self_attn.v_proj.weight": "model-00102-of-00142.safetensors", + "model.layers.68.input_layernorm.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.0.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.0.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.0.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.1.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.1.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.1.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.10.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.10.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.10.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.100.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.100.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.100.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.101.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.101.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.101.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.102.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.102.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.102.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.103.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.103.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.103.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.104.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.104.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.104.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.105.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.105.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.105.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.106.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.106.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.106.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.107.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.107.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.107.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.108.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.108.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.108.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.109.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.109.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.109.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.11.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.11.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.11.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.110.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.110.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.110.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.111.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.111.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.111.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.112.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.112.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.112.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.113.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.113.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.113.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.114.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.114.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.114.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.115.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.115.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.115.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.116.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.116.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.116.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.117.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.117.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.117.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.118.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.118.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.118.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.119.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.119.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.119.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.12.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.12.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.12.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.120.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.120.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.120.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.121.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.121.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.121.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.122.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.122.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.122.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.123.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.123.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.123.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.124.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.124.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.124.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.125.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.125.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.125.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.126.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.126.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.126.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.127.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.127.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.127.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.128.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.128.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.128.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.129.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.129.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.129.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.13.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.13.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.13.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.130.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.130.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.130.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.131.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.131.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.131.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.132.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.132.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.132.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.133.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.133.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.133.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.134.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.134.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.134.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.135.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.135.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.135.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.136.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.136.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.136.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.137.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.137.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.137.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.138.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.138.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.138.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.139.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.139.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.139.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.14.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.14.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.14.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.140.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.140.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.140.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.141.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.141.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.141.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.142.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.142.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.142.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.143.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.143.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.143.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.144.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.144.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.144.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.145.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.145.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.145.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.146.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.146.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.146.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.147.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.147.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.147.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.148.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.148.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.148.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.149.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.149.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.149.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.15.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.15.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.15.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.150.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.150.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.150.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.151.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.151.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.151.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.152.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.152.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.152.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.153.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.153.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.153.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.154.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.154.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.154.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.155.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.155.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.155.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.156.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.156.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.156.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.157.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.157.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.157.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.158.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.158.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.158.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.159.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.159.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.159.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.16.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.16.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.16.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.17.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.17.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.17.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.18.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.18.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.18.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.19.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.19.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.19.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.2.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.2.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.2.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.20.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.20.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.20.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.21.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.21.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.21.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.22.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.22.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.22.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.23.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.23.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.23.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.24.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.24.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.24.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.25.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.25.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.25.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.26.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.26.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.26.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.27.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.27.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.27.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.28.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.28.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.28.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.29.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.29.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.29.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.3.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.3.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.3.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.30.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.30.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.30.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.31.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.31.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.31.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.32.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.32.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.32.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.33.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.33.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.33.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.34.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.34.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.34.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.35.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.35.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.35.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.36.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.36.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.36.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.37.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.37.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.37.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.38.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.38.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.38.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.39.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.39.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.39.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.4.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.4.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.4.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.40.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.40.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.40.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.41.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.41.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.41.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.42.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.42.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.42.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.43.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.43.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.43.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.44.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.44.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.44.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.45.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.45.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.45.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.46.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.46.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.46.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.47.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.47.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.47.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.48.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.48.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.48.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.49.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.49.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.49.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.5.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.5.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.5.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.50.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.50.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.50.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.51.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.51.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.51.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.52.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.52.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.52.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.53.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.53.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.53.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.54.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.54.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.54.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.55.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.55.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.55.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.56.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.56.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.56.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.57.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.57.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.57.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.58.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.58.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.58.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.59.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.59.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.59.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.6.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.6.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.6.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.60.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.60.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.60.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.61.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.61.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.61.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.62.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.62.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.62.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.63.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.63.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.63.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.64.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.64.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.64.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.65.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.65.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.65.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.66.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.66.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.66.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.67.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.67.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.67.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.68.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.68.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.68.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.69.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.69.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.69.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.7.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.7.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.7.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.70.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.70.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.70.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.71.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.71.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.71.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.72.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.72.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.72.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.73.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.73.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.73.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.74.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.74.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.74.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.75.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.75.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.75.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.76.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.76.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.76.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.77.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.77.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.77.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.78.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.78.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.78.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.79.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.79.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.79.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.8.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.8.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.8.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.80.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.80.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.80.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.81.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.81.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.81.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.82.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.82.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.82.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.83.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.83.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.83.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.84.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.84.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.84.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.85.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.85.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.85.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.86.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.86.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.86.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.87.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.87.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.87.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.88.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.88.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.88.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.89.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.89.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.89.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.9.down_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.9.gate_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.9.up_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.mlp.experts.90.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.90.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.90.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.91.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.91.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.91.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.92.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.92.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.92.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.93.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.93.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.93.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.94.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.94.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.94.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.95.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.95.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.95.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.96.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.96.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.96.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.97.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.97.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.97.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.98.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.98.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.98.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.99.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.99.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.experts.99.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.gate.e_score_correction_bias": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.gate.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.shared_experts.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.shared_experts.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.mlp.shared_experts.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.68.post_attention_layernorm.weight": "model-00105-of-00142.safetensors", + "model.layers.68.self_attn.k_norm.weight": "model-00104-of-00142.safetensors", + "model.layers.68.self_attn.k_proj.bias": "model-00104-of-00142.safetensors", + "model.layers.68.self_attn.k_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.self_attn.o_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.self_attn.q_norm.weight": "model-00104-of-00142.safetensors", + "model.layers.68.self_attn.q_proj.bias": "model-00104-of-00142.safetensors", + "model.layers.68.self_attn.q_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.68.self_attn.v_proj.bias": "model-00104-of-00142.safetensors", + "model.layers.68.self_attn.v_proj.weight": "model-00104-of-00142.safetensors", + "model.layers.69.input_layernorm.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.0.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.0.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.0.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.1.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.1.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.1.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.10.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.10.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.10.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.100.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.100.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.100.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.101.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.101.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.101.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.102.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.102.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.102.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.103.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.103.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.103.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.104.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.104.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.104.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.105.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.105.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.105.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.106.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.106.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.106.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.107.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.107.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.107.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.108.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.108.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.108.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.109.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.109.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.109.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.11.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.11.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.11.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.110.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.110.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.110.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.111.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.111.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.111.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.112.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.112.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.112.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.113.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.113.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.113.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.114.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.114.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.114.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.115.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.115.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.115.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.116.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.116.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.116.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.117.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.117.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.117.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.118.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.118.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.118.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.119.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.119.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.119.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.12.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.12.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.12.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.120.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.120.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.120.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.121.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.121.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.121.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.122.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.122.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.122.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.123.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.123.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.123.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.124.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.124.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.124.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.125.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.125.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.125.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.126.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.126.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.126.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.127.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.127.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.127.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.128.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.128.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.128.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.129.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.129.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.129.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.13.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.13.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.13.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.130.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.130.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.130.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.131.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.131.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.131.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.132.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.132.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.132.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.133.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.133.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.133.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.134.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.134.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.134.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.135.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.135.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.135.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.136.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.136.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.136.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.137.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.137.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.137.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.138.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.138.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.138.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.139.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.139.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.139.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.14.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.14.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.14.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.140.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.140.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.140.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.141.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.141.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.141.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.142.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.142.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.142.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.143.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.143.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.143.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.144.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.144.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.144.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.145.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.145.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.145.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.146.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.146.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.146.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.147.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.147.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.147.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.148.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.148.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.148.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.149.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.149.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.149.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.15.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.15.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.15.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.150.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.150.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.150.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.151.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.151.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.151.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.152.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.152.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.152.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.153.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.153.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.153.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.154.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.154.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.154.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.155.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.155.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.155.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.156.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.156.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.156.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.157.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.157.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.157.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.158.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.158.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.158.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.159.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.159.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.159.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.experts.16.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.16.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.16.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.17.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.17.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.17.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.18.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.18.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.18.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.19.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.19.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.19.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.2.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.2.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.2.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.20.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.20.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.20.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.21.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.21.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.21.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.22.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.22.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.22.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.23.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.23.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.23.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.24.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.24.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.24.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.25.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.25.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.25.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.26.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.26.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.26.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.27.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.27.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.27.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.28.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.28.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.28.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.29.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.29.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.29.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.3.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.3.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.3.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.30.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.30.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.30.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.31.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.31.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.31.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.32.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.32.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.32.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.33.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.33.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.33.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.34.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.34.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.34.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.35.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.35.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.35.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.36.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.36.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.36.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.37.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.37.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.37.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.38.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.38.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.38.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.39.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.39.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.39.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.4.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.4.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.4.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.40.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.40.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.40.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.41.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.41.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.41.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.42.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.42.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.42.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.43.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.43.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.43.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.44.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.44.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.44.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.45.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.45.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.45.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.46.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.46.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.46.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.47.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.47.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.47.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.48.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.48.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.48.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.49.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.49.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.49.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.5.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.5.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.5.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.50.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.50.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.50.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.51.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.51.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.51.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.52.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.52.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.52.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.53.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.53.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.53.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.54.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.54.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.54.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.55.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.55.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.55.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.56.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.56.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.56.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.57.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.57.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.57.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.58.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.58.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.58.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.59.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.59.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.59.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.6.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.6.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.6.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.60.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.60.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.60.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.61.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.61.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.61.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.62.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.62.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.62.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.63.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.63.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.63.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.64.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.64.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.64.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.65.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.65.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.65.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.66.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.66.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.66.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.67.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.67.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.67.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.68.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.68.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.68.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.69.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.69.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.69.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.7.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.7.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.7.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.70.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.70.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.70.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.71.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.71.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.71.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.72.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.72.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.72.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.73.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.73.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.73.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.74.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.74.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.74.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.75.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.75.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.75.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.76.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.76.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.76.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.77.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.77.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.77.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.78.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.78.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.78.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.79.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.79.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.79.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.8.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.8.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.8.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.80.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.80.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.80.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.81.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.81.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.81.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.82.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.82.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.82.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.83.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.83.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.83.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.84.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.84.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.84.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.85.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.85.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.85.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.86.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.86.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.86.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.87.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.87.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.87.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.88.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.88.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.88.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.89.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.89.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.89.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.9.down_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.9.gate_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.9.up_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.mlp.experts.90.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.90.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.90.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.91.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.91.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.91.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.92.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.92.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.92.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.93.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.93.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.93.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.94.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.94.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.94.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.95.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.95.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.95.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.96.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.96.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.96.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.97.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.97.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.97.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.98.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.98.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.98.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.99.down_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.99.gate_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.experts.99.up_proj.weight": "model-00106-of-00142.safetensors", + "model.layers.69.mlp.gate.e_score_correction_bias": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.gate.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.shared_experts.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.shared_experts.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.mlp.shared_experts.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.69.post_attention_layernorm.weight": "model-00107-of-00142.safetensors", + "model.layers.69.self_attn.k_norm.weight": "model-00105-of-00142.safetensors", + "model.layers.69.self_attn.k_proj.bias": "model-00105-of-00142.safetensors", + "model.layers.69.self_attn.k_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.self_attn.o_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.self_attn.q_norm.weight": "model-00105-of-00142.safetensors", + "model.layers.69.self_attn.q_proj.bias": "model-00105-of-00142.safetensors", + "model.layers.69.self_attn.q_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.69.self_attn.v_proj.bias": "model-00105-of-00142.safetensors", + "model.layers.69.self_attn.v_proj.weight": "model-00105-of-00142.safetensors", + "model.layers.7.input_layernorm.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.0.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.0.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.0.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.1.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.1.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.1.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.10.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.10.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.10.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.100.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.100.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.100.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.101.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.101.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.101.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.102.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.102.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.102.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.103.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.103.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.103.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.104.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.104.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.104.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.105.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.105.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.105.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.106.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.106.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.106.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.107.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.107.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.107.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.108.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.108.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.108.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.109.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.109.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.109.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.11.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.11.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.11.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.110.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.110.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.110.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.111.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.111.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.111.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.112.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.112.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.112.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.113.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.113.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.113.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.114.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.114.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.114.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.115.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.115.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.115.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.116.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.116.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.116.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.117.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.117.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.117.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.118.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.118.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.118.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.119.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.119.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.119.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.12.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.12.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.12.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.120.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.120.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.120.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.121.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.121.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.121.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.122.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.122.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.122.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.123.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.123.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.123.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.124.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.124.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.124.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.125.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.125.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.125.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.126.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.126.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.126.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.127.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.127.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.127.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.128.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.128.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.128.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.129.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.129.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.129.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.13.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.13.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.13.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.130.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.130.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.130.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.131.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.131.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.131.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.132.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.132.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.132.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.133.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.133.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.133.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.134.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.134.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.134.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.135.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.135.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.135.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.136.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.136.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.136.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.137.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.137.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.137.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.138.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.138.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.138.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.139.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.139.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.139.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.14.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.14.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.14.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.140.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.140.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.140.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.141.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.141.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.141.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.142.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.142.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.142.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.143.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.143.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.143.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.144.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.144.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.144.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.145.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.145.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.145.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.146.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.146.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.146.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.147.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.147.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.147.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.148.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.148.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.148.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.149.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.149.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.149.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.15.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.15.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.15.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.150.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.150.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.150.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.151.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.151.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.151.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.152.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.152.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.152.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.153.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.153.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.153.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.154.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.154.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.154.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.155.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.155.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.155.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.156.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.156.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.156.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.157.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.157.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.157.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.158.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.158.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.158.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.159.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.159.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.159.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.16.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.16.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.16.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.17.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.17.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.17.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.18.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.18.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.18.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.19.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.19.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.19.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.2.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.2.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.2.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.20.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.20.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.20.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.21.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.21.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.21.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.22.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.22.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.22.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.23.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.23.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.23.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.24.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.24.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.24.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.25.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.25.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.25.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.26.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.26.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.26.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.27.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.27.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.27.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.28.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.28.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.28.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.29.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.29.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.29.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.3.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.3.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.3.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.30.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.30.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.30.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.31.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.31.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.31.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.32.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.32.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.32.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.33.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.33.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.33.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.34.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.34.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.34.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.35.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.35.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.35.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.36.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.36.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.36.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.37.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.37.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.37.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.38.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.38.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.38.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.39.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.39.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.39.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.4.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.4.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.4.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.40.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.40.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.40.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.41.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.41.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.41.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.42.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.42.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.42.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.43.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.43.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.43.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.44.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.44.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.44.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.45.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.45.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.45.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.46.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.46.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.46.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.47.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.47.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.47.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.48.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.48.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.48.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.49.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.49.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.49.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.5.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.5.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.5.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.50.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.50.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.50.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.51.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.51.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.51.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.52.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.52.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.52.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.53.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.53.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.53.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.54.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.54.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.54.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.55.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.55.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.55.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.56.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.56.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.56.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.57.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.57.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.57.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.58.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.58.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.58.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.59.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.59.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.59.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.6.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.6.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.6.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.60.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.60.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.60.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.61.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.61.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.61.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.62.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.62.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.62.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.63.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.63.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.63.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.64.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.64.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.64.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.65.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.65.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.65.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.66.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.66.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.66.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.67.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.67.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.67.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.68.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.68.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.68.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.69.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.69.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.69.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.7.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.7.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.7.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.70.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.70.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.70.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.71.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.71.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.71.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.72.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.72.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.72.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.73.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.73.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.73.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.74.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.74.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.74.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.75.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.75.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.75.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.76.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.76.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.76.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.77.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.77.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.77.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.78.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.78.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.78.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.79.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.79.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.79.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.8.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.8.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.8.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.80.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.80.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.80.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.81.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.81.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.81.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.82.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.82.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.82.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.83.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.83.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.83.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.84.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.84.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.84.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.85.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.85.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.85.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.86.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.86.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.86.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.87.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.87.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.87.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.88.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.88.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.88.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.89.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.89.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.89.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.9.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.9.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.9.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.90.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.90.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.90.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.91.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.91.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.91.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.92.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.92.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.92.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.93.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.93.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.93.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.94.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.94.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.94.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.95.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.95.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.95.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.96.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.96.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.96.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.97.down_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.97.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.97.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.98.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.98.gate_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.98.up_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.mlp.experts.99.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.99.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.experts.99.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.gate.e_score_correction_bias": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.gate.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.shared_experts.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.shared_experts.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.mlp.shared_experts.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00009-of-00142.safetensors", + "model.layers.7.self_attn.k_norm.weight": "model-00008-of-00142.safetensors", + "model.layers.7.self_attn.k_proj.bias": "model-00008-of-00142.safetensors", + "model.layers.7.self_attn.k_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.self_attn.q_norm.weight": "model-00008-of-00142.safetensors", + "model.layers.7.self_attn.q_proj.bias": "model-00008-of-00142.safetensors", + "model.layers.7.self_attn.q_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.7.self_attn.v_proj.bias": "model-00008-of-00142.safetensors", + "model.layers.7.self_attn.v_proj.weight": "model-00008-of-00142.safetensors", + "model.layers.70.input_layernorm.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.0.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.0.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.0.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.1.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.1.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.1.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.10.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.10.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.10.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.100.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.100.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.100.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.101.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.101.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.101.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.102.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.102.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.102.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.103.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.103.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.103.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.104.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.104.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.104.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.105.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.105.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.105.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.106.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.106.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.106.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.107.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.107.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.107.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.108.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.108.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.108.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.109.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.109.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.109.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.11.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.11.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.11.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.110.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.110.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.110.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.111.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.111.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.111.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.112.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.112.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.112.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.113.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.113.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.113.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.114.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.114.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.114.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.115.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.115.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.115.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.116.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.116.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.116.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.117.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.117.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.117.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.118.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.118.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.118.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.119.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.119.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.119.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.12.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.12.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.12.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.120.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.120.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.120.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.121.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.121.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.121.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.122.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.122.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.122.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.123.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.123.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.123.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.124.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.124.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.124.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.125.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.125.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.125.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.126.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.126.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.126.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.127.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.127.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.127.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.128.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.128.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.128.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.129.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.129.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.129.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.13.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.13.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.13.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.130.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.130.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.130.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.131.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.131.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.131.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.132.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.132.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.132.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.133.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.133.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.133.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.134.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.134.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.134.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.135.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.135.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.135.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.136.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.136.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.136.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.137.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.137.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.137.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.138.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.138.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.138.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.139.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.139.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.139.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.14.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.14.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.14.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.140.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.140.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.140.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.141.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.141.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.141.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.142.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.142.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.142.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.143.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.143.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.143.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.144.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.144.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.144.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.145.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.145.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.145.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.146.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.146.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.146.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.147.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.147.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.147.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.148.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.148.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.148.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.149.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.149.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.149.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.15.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.15.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.15.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.150.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.150.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.150.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.151.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.151.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.151.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.152.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.152.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.152.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.153.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.153.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.153.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.154.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.154.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.154.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.155.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.155.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.155.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.156.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.156.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.156.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.157.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.157.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.157.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.158.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.158.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.158.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.159.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.159.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.159.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.16.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.16.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.16.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.17.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.17.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.17.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.18.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.18.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.18.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.19.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.19.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.19.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.2.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.2.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.2.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.20.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.20.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.20.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.21.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.21.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.21.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.22.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.22.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.22.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.23.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.23.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.23.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.24.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.24.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.24.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.25.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.25.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.25.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.26.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.26.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.26.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.27.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.27.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.27.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.28.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.28.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.28.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.29.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.29.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.29.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.3.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.3.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.3.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.30.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.30.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.30.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.31.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.31.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.31.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.32.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.32.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.32.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.33.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.33.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.33.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.34.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.34.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.34.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.35.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.35.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.35.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.36.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.36.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.36.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.37.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.37.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.37.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.38.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.38.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.38.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.39.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.39.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.39.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.4.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.4.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.4.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.40.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.40.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.40.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.41.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.41.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.41.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.42.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.42.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.42.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.43.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.43.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.43.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.44.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.44.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.44.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.45.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.45.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.45.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.46.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.46.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.46.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.47.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.47.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.47.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.48.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.48.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.48.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.49.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.49.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.49.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.5.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.5.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.5.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.50.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.50.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.50.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.51.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.51.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.51.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.52.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.52.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.52.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.53.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.53.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.53.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.54.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.54.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.54.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.55.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.55.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.55.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.56.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.56.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.56.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.57.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.57.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.57.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.58.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.58.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.58.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.59.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.59.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.59.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.6.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.6.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.6.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.60.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.60.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.60.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.61.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.61.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.61.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.62.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.62.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.62.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.63.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.63.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.63.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.64.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.64.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.64.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.65.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.65.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.65.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.66.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.66.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.66.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.67.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.67.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.67.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.68.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.68.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.68.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.69.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.69.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.69.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.7.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.7.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.7.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.70.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.70.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.70.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.71.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.71.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.71.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.72.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.72.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.72.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.73.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.73.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.73.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.74.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.74.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.74.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.75.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.75.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.75.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.76.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.76.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.76.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.77.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.77.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.77.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.78.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.78.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.78.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.79.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.79.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.79.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.8.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.8.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.8.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.80.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.80.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.80.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.81.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.81.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.81.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.82.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.82.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.82.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.83.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.83.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.83.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.84.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.84.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.84.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.85.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.85.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.85.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.86.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.86.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.86.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.87.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.87.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.87.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.88.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.88.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.88.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.89.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.89.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.89.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.9.down_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.9.gate_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.9.up_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.mlp.experts.90.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.90.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.90.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.91.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.91.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.91.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.92.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.92.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.92.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.93.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.93.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.93.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.94.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.94.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.94.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.95.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.95.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.95.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.96.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.96.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.96.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.97.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.97.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.97.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.98.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.98.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.98.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.99.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.99.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.experts.99.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.gate.e_score_correction_bias": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.gate.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.shared_experts.down_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.shared_experts.gate_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.mlp.shared_experts.up_proj.weight": "model-00108-of-00142.safetensors", + "model.layers.70.post_attention_layernorm.weight": "model-00108-of-00142.safetensors", + "model.layers.70.self_attn.k_norm.weight": "model-00107-of-00142.safetensors", + "model.layers.70.self_attn.k_proj.bias": "model-00107-of-00142.safetensors", + "model.layers.70.self_attn.k_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.self_attn.o_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.self_attn.q_norm.weight": "model-00107-of-00142.safetensors", + "model.layers.70.self_attn.q_proj.bias": "model-00107-of-00142.safetensors", + "model.layers.70.self_attn.q_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.70.self_attn.v_proj.bias": "model-00107-of-00142.safetensors", + "model.layers.70.self_attn.v_proj.weight": "model-00107-of-00142.safetensors", + "model.layers.71.input_layernorm.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.0.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.0.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.0.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.1.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.1.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.1.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.10.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.10.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.10.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.100.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.100.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.100.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.101.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.101.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.101.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.102.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.102.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.102.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.103.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.103.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.103.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.104.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.104.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.104.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.105.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.105.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.105.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.106.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.106.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.106.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.107.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.107.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.107.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.108.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.108.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.108.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.109.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.109.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.109.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.11.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.11.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.11.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.110.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.110.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.110.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.111.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.111.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.111.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.112.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.112.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.112.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.113.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.113.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.113.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.114.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.114.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.114.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.115.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.115.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.115.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.116.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.116.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.116.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.117.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.117.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.117.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.118.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.118.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.118.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.119.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.119.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.119.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.12.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.12.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.12.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.120.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.120.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.120.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.121.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.121.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.121.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.122.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.122.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.122.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.123.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.123.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.123.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.124.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.124.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.124.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.125.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.125.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.125.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.126.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.126.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.126.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.127.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.127.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.127.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.128.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.128.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.128.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.129.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.129.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.129.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.13.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.13.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.13.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.130.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.130.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.130.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.131.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.131.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.131.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.132.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.132.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.132.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.133.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.133.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.133.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.134.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.134.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.134.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.135.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.135.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.135.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.136.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.136.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.136.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.137.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.137.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.137.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.138.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.138.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.138.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.139.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.139.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.139.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.14.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.14.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.14.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.140.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.140.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.140.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.141.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.141.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.141.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.142.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.142.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.142.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.143.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.143.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.143.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.144.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.144.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.144.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.145.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.145.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.145.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.146.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.146.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.146.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.147.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.147.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.147.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.148.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.148.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.148.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.149.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.149.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.149.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.15.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.15.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.15.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.150.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.150.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.150.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.151.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.151.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.151.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.152.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.152.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.152.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.153.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.153.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.153.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.154.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.154.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.154.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.155.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.155.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.155.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.156.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.156.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.156.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.157.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.157.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.157.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.158.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.158.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.158.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.159.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.159.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.159.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.experts.16.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.16.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.16.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.17.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.17.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.17.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.18.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.18.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.18.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.19.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.19.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.19.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.2.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.2.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.2.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.20.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.20.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.20.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.21.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.21.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.21.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.22.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.22.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.22.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.23.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.23.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.23.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.24.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.24.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.24.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.25.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.25.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.25.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.26.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.26.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.26.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.27.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.27.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.27.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.28.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.28.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.28.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.29.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.29.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.29.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.3.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.3.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.3.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.30.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.30.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.30.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.31.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.31.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.31.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.32.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.32.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.32.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.33.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.33.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.33.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.34.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.34.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.34.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.35.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.35.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.35.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.36.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.36.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.36.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.37.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.37.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.37.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.38.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.38.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.38.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.39.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.39.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.39.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.4.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.4.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.4.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.40.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.40.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.40.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.41.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.41.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.41.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.42.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.42.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.42.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.43.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.43.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.43.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.44.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.44.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.44.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.45.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.45.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.45.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.46.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.46.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.46.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.47.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.47.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.47.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.48.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.48.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.48.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.49.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.49.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.49.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.5.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.5.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.5.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.50.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.50.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.50.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.51.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.51.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.51.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.52.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.52.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.52.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.53.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.53.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.53.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.54.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.54.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.54.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.55.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.55.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.55.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.56.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.56.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.56.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.57.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.57.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.57.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.58.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.58.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.58.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.59.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.59.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.59.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.6.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.6.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.6.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.60.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.60.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.60.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.61.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.61.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.61.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.62.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.62.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.62.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.63.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.63.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.63.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.64.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.64.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.64.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.65.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.65.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.65.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.66.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.66.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.66.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.67.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.67.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.67.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.68.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.68.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.68.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.69.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.69.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.69.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.7.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.7.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.7.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.70.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.70.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.70.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.71.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.71.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.71.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.72.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.72.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.72.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.73.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.73.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.73.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.74.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.74.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.74.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.75.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.75.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.75.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.76.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.76.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.76.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.77.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.77.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.77.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.78.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.78.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.78.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.79.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.79.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.79.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.8.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.8.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.8.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.80.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.80.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.80.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.81.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.81.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.81.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.82.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.82.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.82.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.83.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.83.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.83.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.84.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.84.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.84.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.85.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.85.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.85.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.86.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.86.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.86.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.87.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.87.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.87.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.88.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.88.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.88.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.89.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.89.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.89.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.9.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.9.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.9.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.90.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.90.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.90.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.91.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.91.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.91.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.92.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.92.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.92.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.93.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.93.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.93.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.94.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.94.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.94.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.95.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.95.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.95.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.96.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.96.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.96.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.97.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.97.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.97.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.98.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.98.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.98.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.99.down_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.99.gate_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.experts.99.up_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.mlp.gate.e_score_correction_bias": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.gate.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.shared_experts.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.shared_experts.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.mlp.shared_experts.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.71.post_attention_layernorm.weight": "model-00110-of-00142.safetensors", + "model.layers.71.self_attn.k_norm.weight": "model-00109-of-00142.safetensors", + "model.layers.71.self_attn.k_proj.bias": "model-00109-of-00142.safetensors", + "model.layers.71.self_attn.k_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.self_attn.o_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.self_attn.q_norm.weight": "model-00109-of-00142.safetensors", + "model.layers.71.self_attn.q_proj.bias": "model-00109-of-00142.safetensors", + "model.layers.71.self_attn.q_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.71.self_attn.v_proj.bias": "model-00109-of-00142.safetensors", + "model.layers.71.self_attn.v_proj.weight": "model-00109-of-00142.safetensors", + "model.layers.72.input_layernorm.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.0.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.0.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.0.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.1.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.1.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.1.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.10.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.10.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.10.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.100.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.100.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.100.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.101.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.101.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.101.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.102.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.102.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.102.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.103.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.103.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.103.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.104.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.104.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.104.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.105.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.105.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.105.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.106.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.106.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.106.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.107.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.107.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.107.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.108.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.108.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.108.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.109.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.109.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.109.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.11.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.11.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.11.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.110.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.110.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.110.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.111.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.111.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.111.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.112.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.112.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.112.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.113.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.113.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.113.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.114.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.114.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.114.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.115.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.115.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.115.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.116.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.116.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.116.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.117.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.117.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.117.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.118.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.118.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.118.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.119.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.119.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.119.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.12.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.12.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.12.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.120.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.120.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.120.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.121.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.121.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.121.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.122.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.122.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.122.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.123.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.123.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.123.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.124.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.124.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.124.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.125.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.125.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.125.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.126.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.126.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.126.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.127.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.127.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.127.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.128.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.128.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.128.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.129.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.129.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.129.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.13.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.13.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.13.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.130.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.130.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.130.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.131.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.131.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.131.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.132.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.132.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.132.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.133.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.133.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.133.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.134.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.134.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.134.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.135.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.135.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.135.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.136.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.136.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.136.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.137.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.137.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.137.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.138.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.138.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.138.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.139.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.139.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.139.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.14.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.14.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.14.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.140.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.140.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.140.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.141.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.141.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.141.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.142.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.142.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.142.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.143.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.143.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.143.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.144.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.144.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.144.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.145.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.145.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.145.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.146.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.146.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.146.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.147.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.147.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.147.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.148.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.148.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.148.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.149.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.149.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.149.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.15.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.15.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.15.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.150.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.150.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.150.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.151.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.151.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.151.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.152.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.152.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.152.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.153.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.153.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.153.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.154.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.154.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.154.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.155.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.155.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.155.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.156.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.156.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.156.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.157.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.157.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.157.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.158.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.158.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.158.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.159.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.159.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.159.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.experts.16.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.16.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.16.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.17.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.17.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.17.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.18.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.18.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.18.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.19.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.19.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.19.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.2.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.2.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.2.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.20.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.20.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.20.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.21.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.21.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.21.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.22.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.22.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.22.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.23.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.23.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.23.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.24.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.24.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.24.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.25.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.25.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.25.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.26.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.26.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.26.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.27.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.27.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.27.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.28.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.28.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.28.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.29.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.29.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.29.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.3.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.3.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.3.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.30.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.30.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.30.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.31.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.31.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.31.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.32.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.32.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.32.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.33.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.33.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.33.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.34.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.34.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.34.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.35.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.35.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.35.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.36.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.36.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.36.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.37.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.37.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.37.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.38.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.38.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.38.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.39.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.39.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.39.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.4.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.4.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.4.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.40.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.40.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.40.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.41.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.41.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.41.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.42.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.42.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.42.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.43.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.43.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.43.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.44.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.44.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.44.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.45.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.45.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.45.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.46.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.46.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.46.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.47.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.47.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.47.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.48.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.48.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.48.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.49.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.49.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.49.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.5.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.5.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.5.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.50.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.50.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.50.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.51.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.51.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.51.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.52.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.52.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.52.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.53.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.53.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.53.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.54.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.54.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.54.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.55.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.55.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.55.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.56.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.56.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.56.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.57.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.57.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.57.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.58.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.58.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.58.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.59.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.59.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.59.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.6.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.6.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.6.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.60.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.60.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.60.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.61.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.61.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.61.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.62.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.62.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.62.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.63.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.63.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.63.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.64.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.64.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.64.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.65.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.65.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.65.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.66.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.66.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.66.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.67.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.67.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.67.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.68.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.68.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.68.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.69.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.69.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.69.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.7.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.7.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.7.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.70.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.70.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.70.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.71.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.71.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.71.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.72.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.72.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.72.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.73.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.73.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.73.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.74.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.74.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.74.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.75.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.75.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.75.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.76.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.76.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.76.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.77.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.77.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.77.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.78.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.78.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.78.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.79.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.79.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.79.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.8.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.8.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.8.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.80.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.80.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.80.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.81.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.81.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.81.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.82.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.82.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.82.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.83.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.83.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.83.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.84.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.84.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.84.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.85.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.85.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.85.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.86.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.86.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.86.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.87.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.87.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.87.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.88.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.88.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.88.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.89.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.89.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.89.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.9.down_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.9.gate_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.9.up_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.mlp.experts.90.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.90.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.90.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.91.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.91.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.91.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.92.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.92.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.92.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.93.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.93.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.93.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.94.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.94.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.94.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.95.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.95.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.95.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.96.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.96.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.96.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.97.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.97.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.97.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.98.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.98.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.98.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.99.down_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.99.gate_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.experts.99.up_proj.weight": "model-00111-of-00142.safetensors", + "model.layers.72.mlp.gate.e_score_correction_bias": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.gate.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.shared_experts.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.shared_experts.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.mlp.shared_experts.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.72.post_attention_layernorm.weight": "model-00112-of-00142.safetensors", + "model.layers.72.self_attn.k_norm.weight": "model-00110-of-00142.safetensors", + "model.layers.72.self_attn.k_proj.bias": "model-00110-of-00142.safetensors", + "model.layers.72.self_attn.k_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.self_attn.o_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.self_attn.q_norm.weight": "model-00110-of-00142.safetensors", + "model.layers.72.self_attn.q_proj.bias": "model-00110-of-00142.safetensors", + "model.layers.72.self_attn.q_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.72.self_attn.v_proj.bias": "model-00110-of-00142.safetensors", + "model.layers.72.self_attn.v_proj.weight": "model-00110-of-00142.safetensors", + "model.layers.73.input_layernorm.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.0.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.0.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.0.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.1.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.1.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.1.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.10.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.10.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.10.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.100.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.100.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.100.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.101.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.101.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.101.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.102.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.102.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.102.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.103.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.103.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.103.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.104.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.104.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.104.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.105.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.105.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.105.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.106.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.106.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.106.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.107.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.107.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.107.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.108.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.108.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.108.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.109.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.109.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.109.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.11.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.11.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.11.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.110.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.110.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.110.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.111.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.111.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.111.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.112.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.112.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.112.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.113.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.113.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.113.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.114.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.114.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.114.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.115.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.115.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.115.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.116.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.116.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.116.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.117.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.117.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.117.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.118.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.118.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.118.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.119.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.119.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.119.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.12.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.12.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.12.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.120.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.120.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.120.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.121.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.121.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.121.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.122.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.122.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.122.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.123.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.123.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.123.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.124.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.124.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.124.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.125.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.125.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.125.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.126.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.126.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.126.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.127.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.127.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.127.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.128.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.128.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.128.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.129.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.129.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.129.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.13.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.13.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.13.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.130.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.130.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.130.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.131.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.131.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.131.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.132.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.132.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.132.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.133.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.133.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.133.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.134.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.134.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.134.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.135.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.135.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.135.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.136.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.136.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.136.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.137.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.137.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.137.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.138.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.138.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.138.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.139.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.139.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.139.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.14.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.14.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.14.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.140.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.140.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.140.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.141.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.141.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.141.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.142.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.142.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.142.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.143.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.143.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.143.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.144.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.144.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.144.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.145.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.145.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.145.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.146.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.146.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.146.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.147.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.147.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.147.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.148.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.148.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.148.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.149.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.149.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.149.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.15.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.15.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.15.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.150.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.150.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.150.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.151.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.151.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.151.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.152.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.152.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.152.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.153.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.153.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.153.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.154.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.154.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.154.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.155.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.155.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.155.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.156.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.156.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.156.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.157.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.157.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.157.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.158.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.158.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.158.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.159.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.159.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.159.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.16.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.16.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.16.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.17.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.17.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.17.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.18.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.18.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.18.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.19.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.19.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.19.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.2.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.2.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.2.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.20.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.20.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.20.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.21.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.21.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.21.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.22.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.22.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.22.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.23.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.23.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.23.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.24.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.24.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.24.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.25.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.25.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.25.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.26.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.26.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.26.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.27.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.27.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.27.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.28.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.28.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.28.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.29.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.29.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.29.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.3.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.3.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.3.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.30.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.30.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.30.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.31.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.31.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.31.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.32.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.32.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.32.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.33.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.33.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.33.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.34.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.34.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.34.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.35.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.35.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.35.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.36.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.36.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.36.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.37.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.37.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.37.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.38.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.38.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.38.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.39.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.39.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.39.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.4.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.4.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.4.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.40.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.40.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.40.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.41.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.41.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.41.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.42.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.42.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.42.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.43.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.43.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.43.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.44.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.44.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.44.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.45.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.45.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.45.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.46.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.46.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.46.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.47.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.47.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.47.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.48.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.48.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.48.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.49.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.49.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.49.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.5.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.5.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.5.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.50.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.50.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.50.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.51.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.51.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.51.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.52.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.52.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.52.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.53.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.53.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.53.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.54.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.54.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.54.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.55.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.55.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.55.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.56.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.56.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.56.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.57.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.57.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.57.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.58.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.58.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.58.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.59.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.59.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.59.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.6.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.6.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.6.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.60.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.60.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.60.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.61.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.61.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.61.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.62.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.62.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.62.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.63.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.63.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.63.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.64.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.64.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.64.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.65.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.65.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.65.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.66.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.66.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.66.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.67.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.67.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.67.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.68.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.68.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.68.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.69.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.69.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.69.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.7.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.7.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.7.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.70.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.70.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.70.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.71.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.71.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.71.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.72.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.72.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.72.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.73.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.73.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.73.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.74.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.74.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.74.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.75.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.75.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.75.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.76.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.76.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.76.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.77.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.77.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.77.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.78.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.78.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.78.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.79.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.79.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.79.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.8.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.8.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.8.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.80.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.80.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.80.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.81.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.81.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.81.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.82.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.82.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.82.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.83.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.83.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.83.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.84.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.84.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.84.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.85.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.85.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.85.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.86.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.86.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.86.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.87.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.87.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.87.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.88.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.88.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.88.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.89.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.89.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.89.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.9.down_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.9.gate_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.9.up_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.mlp.experts.90.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.90.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.90.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.91.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.91.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.91.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.92.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.92.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.92.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.93.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.93.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.93.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.94.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.94.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.94.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.95.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.95.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.95.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.96.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.96.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.96.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.97.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.97.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.97.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.98.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.98.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.98.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.99.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.99.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.experts.99.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.gate.e_score_correction_bias": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.gate.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.shared_experts.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.shared_experts.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.mlp.shared_experts.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.73.post_attention_layernorm.weight": "model-00113-of-00142.safetensors", + "model.layers.73.self_attn.k_norm.weight": "model-00112-of-00142.safetensors", + "model.layers.73.self_attn.k_proj.bias": "model-00112-of-00142.safetensors", + "model.layers.73.self_attn.k_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.self_attn.o_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.self_attn.q_norm.weight": "model-00112-of-00142.safetensors", + "model.layers.73.self_attn.q_proj.bias": "model-00112-of-00142.safetensors", + "model.layers.73.self_attn.q_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.73.self_attn.v_proj.bias": "model-00112-of-00142.safetensors", + "model.layers.73.self_attn.v_proj.weight": "model-00112-of-00142.safetensors", + "model.layers.74.input_layernorm.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.0.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.0.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.0.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.1.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.1.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.1.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.10.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.10.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.10.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.100.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.100.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.100.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.101.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.101.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.101.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.102.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.102.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.102.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.103.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.103.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.103.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.104.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.104.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.104.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.105.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.105.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.105.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.106.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.106.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.106.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.107.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.107.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.107.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.108.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.108.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.108.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.109.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.109.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.109.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.11.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.11.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.11.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.110.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.110.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.110.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.111.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.111.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.111.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.112.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.112.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.112.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.113.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.113.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.113.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.114.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.114.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.114.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.115.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.115.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.115.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.116.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.116.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.116.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.117.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.117.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.117.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.118.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.118.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.118.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.119.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.119.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.119.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.12.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.12.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.12.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.120.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.120.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.120.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.121.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.121.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.121.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.122.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.122.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.122.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.123.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.123.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.123.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.124.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.124.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.124.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.125.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.125.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.125.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.126.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.126.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.126.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.127.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.127.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.127.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.128.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.128.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.128.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.129.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.129.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.129.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.13.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.13.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.13.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.130.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.130.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.130.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.131.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.131.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.131.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.132.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.132.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.132.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.133.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.133.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.133.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.134.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.134.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.134.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.135.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.135.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.135.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.136.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.136.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.136.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.137.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.137.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.137.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.138.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.138.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.138.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.139.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.139.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.139.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.14.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.14.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.14.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.140.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.140.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.140.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.141.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.141.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.141.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.142.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.142.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.142.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.143.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.143.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.143.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.144.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.144.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.144.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.145.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.145.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.145.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.146.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.146.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.146.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.147.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.147.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.147.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.148.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.148.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.148.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.149.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.149.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.149.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.15.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.15.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.15.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.150.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.150.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.150.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.151.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.151.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.151.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.152.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.152.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.152.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.153.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.153.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.153.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.154.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.154.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.154.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.155.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.155.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.155.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.156.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.156.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.156.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.157.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.157.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.157.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.158.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.158.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.158.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.159.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.159.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.159.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.experts.16.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.16.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.16.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.17.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.17.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.17.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.18.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.18.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.18.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.19.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.19.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.19.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.2.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.2.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.2.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.20.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.20.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.20.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.21.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.21.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.21.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.22.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.22.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.22.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.23.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.23.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.23.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.24.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.24.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.24.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.25.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.25.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.25.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.26.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.26.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.26.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.27.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.27.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.27.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.28.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.28.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.28.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.29.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.29.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.29.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.3.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.3.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.3.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.30.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.30.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.30.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.31.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.31.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.31.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.32.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.32.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.32.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.33.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.33.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.33.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.34.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.34.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.34.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.35.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.35.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.35.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.36.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.36.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.36.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.37.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.37.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.37.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.38.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.38.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.38.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.39.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.39.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.39.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.4.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.4.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.4.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.40.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.40.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.40.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.41.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.41.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.41.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.42.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.42.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.42.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.43.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.43.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.43.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.44.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.44.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.44.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.45.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.45.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.45.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.46.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.46.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.46.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.47.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.47.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.47.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.48.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.48.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.48.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.49.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.49.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.49.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.5.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.5.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.5.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.50.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.50.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.50.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.51.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.51.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.51.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.52.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.52.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.52.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.53.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.53.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.53.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.54.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.54.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.54.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.55.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.55.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.55.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.56.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.56.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.56.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.57.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.57.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.57.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.58.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.58.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.58.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.59.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.59.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.59.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.6.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.6.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.6.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.60.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.60.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.60.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.61.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.61.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.61.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.62.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.62.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.62.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.63.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.63.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.63.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.64.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.64.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.64.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.65.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.65.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.65.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.66.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.66.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.66.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.67.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.67.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.67.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.68.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.68.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.68.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.69.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.69.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.69.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.7.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.7.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.7.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.70.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.70.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.70.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.71.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.71.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.71.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.72.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.72.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.72.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.73.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.73.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.73.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.74.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.74.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.74.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.75.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.75.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.75.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.76.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.76.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.76.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.77.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.77.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.77.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.78.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.78.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.78.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.79.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.79.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.79.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.8.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.8.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.8.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.80.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.80.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.80.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.81.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.81.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.81.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.82.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.82.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.82.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.83.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.83.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.83.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.84.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.84.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.84.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.85.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.85.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.85.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.86.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.86.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.86.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.87.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.87.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.87.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.88.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.88.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.88.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.89.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.89.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.89.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.9.down_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.9.gate_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.9.up_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.mlp.experts.90.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.90.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.90.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.91.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.91.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.91.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.92.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.92.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.92.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.93.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.93.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.93.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.94.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.94.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.94.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.95.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.95.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.95.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.96.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.96.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.96.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.97.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.97.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.97.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.98.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.98.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.98.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.99.down_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.99.gate_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.experts.99.up_proj.weight": "model-00114-of-00142.safetensors", + "model.layers.74.mlp.gate.e_score_correction_bias": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.gate.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.shared_experts.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.shared_experts.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.mlp.shared_experts.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.74.post_attention_layernorm.weight": "model-00115-of-00142.safetensors", + "model.layers.74.self_attn.k_norm.weight": "model-00113-of-00142.safetensors", + "model.layers.74.self_attn.k_proj.bias": "model-00113-of-00142.safetensors", + "model.layers.74.self_attn.k_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.self_attn.o_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.self_attn.q_norm.weight": "model-00113-of-00142.safetensors", + "model.layers.74.self_attn.q_proj.bias": "model-00113-of-00142.safetensors", + "model.layers.74.self_attn.q_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.74.self_attn.v_proj.bias": "model-00113-of-00142.safetensors", + "model.layers.74.self_attn.v_proj.weight": "model-00113-of-00142.safetensors", + "model.layers.75.input_layernorm.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.0.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.0.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.0.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.1.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.1.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.1.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.10.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.10.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.10.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.100.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.100.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.100.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.101.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.101.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.101.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.102.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.102.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.102.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.103.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.103.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.103.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.104.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.104.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.104.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.105.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.105.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.105.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.106.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.106.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.106.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.107.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.107.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.107.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.108.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.108.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.108.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.109.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.109.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.109.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.11.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.11.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.11.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.110.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.110.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.110.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.111.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.111.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.111.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.112.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.112.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.112.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.113.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.113.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.113.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.114.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.114.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.114.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.115.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.115.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.115.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.116.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.116.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.116.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.117.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.117.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.117.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.118.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.118.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.118.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.119.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.119.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.119.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.12.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.12.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.12.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.120.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.120.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.120.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.121.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.121.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.121.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.122.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.122.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.122.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.123.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.123.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.123.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.124.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.124.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.124.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.125.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.125.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.125.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.126.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.126.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.126.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.127.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.127.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.127.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.128.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.128.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.128.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.129.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.129.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.129.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.13.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.13.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.13.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.130.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.130.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.130.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.131.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.131.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.131.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.132.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.132.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.132.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.133.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.133.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.133.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.134.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.134.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.134.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.135.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.135.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.135.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.136.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.136.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.136.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.137.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.137.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.137.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.138.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.138.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.138.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.139.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.139.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.139.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.14.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.14.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.14.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.140.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.140.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.140.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.141.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.141.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.141.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.142.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.142.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.142.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.143.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.143.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.143.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.144.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.144.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.144.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.145.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.145.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.145.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.146.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.146.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.146.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.147.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.147.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.147.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.148.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.148.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.148.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.149.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.149.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.149.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.15.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.15.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.15.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.150.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.150.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.150.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.151.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.151.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.151.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.152.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.152.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.152.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.153.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.153.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.153.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.154.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.154.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.154.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.155.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.155.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.155.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.156.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.156.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.156.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.157.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.157.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.157.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.158.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.158.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.158.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.159.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.159.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.159.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.16.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.16.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.16.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.17.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.17.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.17.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.18.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.18.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.18.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.19.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.19.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.19.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.2.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.2.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.2.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.20.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.20.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.20.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.21.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.21.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.21.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.22.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.22.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.22.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.23.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.23.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.23.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.24.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.24.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.24.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.25.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.25.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.25.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.26.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.26.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.26.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.27.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.27.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.27.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.28.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.28.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.28.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.29.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.29.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.29.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.3.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.3.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.3.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.30.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.30.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.30.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.31.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.31.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.31.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.32.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.32.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.32.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.33.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.33.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.33.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.34.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.34.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.34.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.35.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.35.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.35.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.36.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.36.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.36.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.37.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.37.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.37.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.38.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.38.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.38.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.39.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.39.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.39.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.4.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.4.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.4.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.40.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.40.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.40.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.41.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.41.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.41.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.42.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.42.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.42.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.43.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.43.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.43.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.44.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.44.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.44.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.45.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.45.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.45.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.46.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.46.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.46.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.47.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.47.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.47.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.48.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.48.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.48.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.49.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.49.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.49.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.5.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.5.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.5.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.50.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.50.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.50.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.51.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.51.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.51.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.52.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.52.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.52.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.53.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.53.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.53.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.54.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.54.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.54.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.55.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.55.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.55.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.56.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.56.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.56.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.57.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.57.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.57.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.58.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.58.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.58.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.59.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.59.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.59.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.6.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.6.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.6.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.60.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.60.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.60.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.61.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.61.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.61.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.62.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.62.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.62.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.63.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.63.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.63.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.64.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.64.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.64.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.65.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.65.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.65.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.66.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.66.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.66.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.67.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.67.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.67.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.68.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.68.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.68.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.69.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.69.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.69.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.7.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.7.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.7.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.70.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.70.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.70.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.71.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.71.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.71.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.72.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.72.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.72.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.73.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.73.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.73.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.74.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.74.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.74.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.75.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.75.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.75.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.76.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.76.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.76.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.77.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.77.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.77.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.78.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.78.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.78.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.79.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.79.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.79.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.8.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.8.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.8.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.80.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.80.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.80.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.81.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.81.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.81.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.82.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.82.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.82.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.83.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.83.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.83.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.84.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.84.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.84.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.85.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.85.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.85.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.86.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.86.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.86.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.87.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.87.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.87.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.88.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.88.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.88.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.89.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.89.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.89.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.9.down_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.9.gate_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.9.up_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.mlp.experts.90.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.90.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.90.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.91.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.91.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.91.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.92.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.92.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.92.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.93.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.93.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.93.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.94.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.94.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.94.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.95.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.95.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.95.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.96.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.96.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.96.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.97.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.97.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.97.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.98.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.98.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.98.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.99.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.99.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.experts.99.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.gate.e_score_correction_bias": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.gate.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.shared_experts.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.shared_experts.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.mlp.shared_experts.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.75.post_attention_layernorm.weight": "model-00116-of-00142.safetensors", + "model.layers.75.self_attn.k_norm.weight": "model-00115-of-00142.safetensors", + "model.layers.75.self_attn.k_proj.bias": "model-00115-of-00142.safetensors", + "model.layers.75.self_attn.k_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.self_attn.o_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.self_attn.q_norm.weight": "model-00115-of-00142.safetensors", + "model.layers.75.self_attn.q_proj.bias": "model-00115-of-00142.safetensors", + "model.layers.75.self_attn.q_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.75.self_attn.v_proj.bias": "model-00115-of-00142.safetensors", + "model.layers.75.self_attn.v_proj.weight": "model-00115-of-00142.safetensors", + "model.layers.76.input_layernorm.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.0.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.0.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.0.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.1.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.1.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.1.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.10.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.10.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.10.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.100.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.100.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.100.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.101.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.101.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.101.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.102.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.102.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.102.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.103.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.103.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.103.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.104.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.104.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.104.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.105.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.105.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.105.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.106.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.106.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.106.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.107.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.107.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.107.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.108.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.108.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.108.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.109.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.109.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.109.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.11.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.11.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.11.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.110.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.110.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.110.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.111.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.111.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.111.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.112.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.112.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.112.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.113.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.113.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.113.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.114.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.114.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.114.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.115.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.115.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.115.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.116.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.116.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.116.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.117.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.117.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.117.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.118.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.118.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.118.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.119.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.119.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.119.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.12.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.12.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.12.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.120.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.120.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.120.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.121.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.121.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.121.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.122.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.122.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.122.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.123.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.123.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.123.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.124.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.124.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.124.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.125.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.125.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.125.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.126.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.126.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.126.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.127.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.127.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.127.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.128.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.128.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.128.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.129.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.129.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.129.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.13.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.13.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.13.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.130.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.130.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.130.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.131.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.131.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.131.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.132.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.132.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.132.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.133.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.133.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.133.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.134.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.134.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.134.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.135.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.135.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.135.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.136.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.136.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.136.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.137.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.137.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.137.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.138.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.138.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.138.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.139.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.139.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.139.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.14.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.14.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.14.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.140.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.140.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.140.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.141.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.141.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.141.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.142.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.142.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.142.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.143.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.143.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.143.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.144.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.144.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.144.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.145.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.145.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.145.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.146.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.146.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.146.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.147.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.147.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.147.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.148.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.148.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.148.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.149.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.149.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.149.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.15.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.15.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.15.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.150.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.150.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.150.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.151.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.151.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.151.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.152.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.152.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.152.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.153.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.153.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.153.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.154.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.154.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.154.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.155.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.155.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.155.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.156.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.156.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.156.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.157.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.157.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.157.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.158.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.158.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.158.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.159.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.159.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.159.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.experts.16.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.16.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.16.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.17.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.17.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.17.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.18.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.18.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.18.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.19.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.19.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.19.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.2.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.2.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.2.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.20.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.20.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.20.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.21.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.21.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.21.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.22.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.22.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.22.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.23.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.23.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.23.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.24.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.24.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.24.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.25.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.25.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.25.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.26.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.26.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.26.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.27.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.27.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.27.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.28.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.28.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.28.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.29.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.29.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.29.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.3.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.3.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.3.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.30.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.30.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.30.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.31.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.31.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.31.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.32.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.32.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.32.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.33.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.33.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.33.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.34.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.34.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.34.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.35.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.35.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.35.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.36.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.36.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.36.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.37.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.37.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.37.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.38.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.38.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.38.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.39.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.39.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.39.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.4.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.4.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.4.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.40.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.40.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.40.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.41.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.41.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.41.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.42.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.42.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.42.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.43.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.43.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.43.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.44.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.44.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.44.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.45.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.45.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.45.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.46.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.46.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.46.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.47.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.47.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.47.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.48.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.48.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.48.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.49.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.49.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.49.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.5.down_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.5.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.5.up_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.50.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.50.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.50.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.51.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.51.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.51.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.52.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.52.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.52.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.53.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.53.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.53.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.54.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.54.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.54.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.55.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.55.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.55.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.56.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.56.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.56.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.57.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.57.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.57.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.58.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.58.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.58.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.59.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.59.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.59.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.6.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.6.gate_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.mlp.experts.6.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.60.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.60.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.60.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.61.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.61.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.61.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.62.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.62.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.62.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.63.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.63.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.63.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.64.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.64.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.64.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.65.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.65.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.65.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.66.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.66.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.66.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.67.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.67.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.67.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.68.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.68.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.68.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.69.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.69.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.69.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.7.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.7.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.7.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.70.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.70.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.70.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.71.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.71.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.71.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.72.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.72.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.72.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.73.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.73.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.73.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.74.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.74.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.74.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.75.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.75.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.75.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.76.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.76.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.76.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.77.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.77.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.77.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.78.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.78.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.78.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.79.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.79.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.79.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.8.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.8.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.8.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.80.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.80.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.80.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.81.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.81.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.81.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.82.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.82.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.82.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.83.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.83.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.83.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.84.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.84.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.84.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.85.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.85.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.85.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.86.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.86.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.86.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.87.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.87.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.87.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.88.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.88.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.88.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.89.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.89.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.89.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.9.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.9.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.9.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.90.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.90.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.90.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.91.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.91.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.91.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.92.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.92.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.92.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.93.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.93.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.93.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.94.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.94.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.94.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.95.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.95.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.95.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.96.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.96.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.96.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.97.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.97.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.97.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.98.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.98.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.98.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.99.down_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.99.gate_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.experts.99.up_proj.weight": "model-00117-of-00142.safetensors", + "model.layers.76.mlp.gate.e_score_correction_bias": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.gate.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.shared_experts.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.shared_experts.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.mlp.shared_experts.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.76.post_attention_layernorm.weight": "model-00118-of-00142.safetensors", + "model.layers.76.self_attn.k_norm.weight": "model-00116-of-00142.safetensors", + "model.layers.76.self_attn.k_proj.bias": "model-00116-of-00142.safetensors", + "model.layers.76.self_attn.k_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.self_attn.o_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.self_attn.q_norm.weight": "model-00116-of-00142.safetensors", + "model.layers.76.self_attn.q_proj.bias": "model-00116-of-00142.safetensors", + "model.layers.76.self_attn.q_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.76.self_attn.v_proj.bias": "model-00116-of-00142.safetensors", + "model.layers.76.self_attn.v_proj.weight": "model-00116-of-00142.safetensors", + "model.layers.77.input_layernorm.weight": "model-00120-of-00142.safetensors", + "model.layers.77.mlp.experts.0.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.0.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.0.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.1.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.1.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.1.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.10.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.10.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.10.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.100.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.100.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.100.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.101.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.101.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.101.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.102.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.102.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.102.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.103.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.103.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.103.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.104.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.104.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.104.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.105.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.105.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.105.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.106.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.106.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.106.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.107.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.107.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.107.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.108.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.108.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.108.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.109.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.109.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.109.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.11.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.11.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.11.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.110.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.110.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.110.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.111.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.111.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.111.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.112.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.112.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.112.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.113.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.113.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.113.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.114.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.114.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.114.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.115.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.115.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.115.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.116.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.116.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.116.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.117.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.117.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.117.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.118.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.118.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.118.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.119.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.119.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.119.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.12.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.12.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.12.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.120.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.120.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.120.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.121.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.121.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.121.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.122.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.122.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.122.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.123.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.123.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.123.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.124.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.124.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.124.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.125.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.125.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.125.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.126.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.126.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.126.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.127.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.127.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.127.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.128.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.128.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.128.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.129.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.129.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.129.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.13.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.13.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.13.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.130.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.130.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.130.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.131.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.131.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.131.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.132.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.132.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.132.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.133.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.133.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.133.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.134.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.134.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.134.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.135.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.135.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.135.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.136.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.136.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.136.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.137.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.137.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.137.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.138.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.138.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.138.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.139.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.139.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.139.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.14.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.14.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.14.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.140.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.140.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.140.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.141.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.141.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.141.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.142.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.142.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.142.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.143.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.143.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.143.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.144.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.144.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.144.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.145.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.145.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.145.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.146.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.146.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.146.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.147.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.147.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.147.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.148.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.148.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.148.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.149.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.149.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.149.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.15.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.15.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.15.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.150.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.150.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.150.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.151.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.151.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.151.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.152.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.152.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.152.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.153.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.153.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.153.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.154.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.154.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.154.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.155.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.155.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.155.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.156.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.77.mlp.experts.156.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.156.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.157.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.77.mlp.experts.157.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.77.mlp.experts.157.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.77.mlp.experts.158.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.77.mlp.experts.158.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.77.mlp.experts.158.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.77.mlp.experts.159.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.77.mlp.experts.159.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.77.mlp.experts.159.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.77.mlp.experts.16.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.16.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.16.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.17.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.17.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.17.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.18.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.18.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.18.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.19.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.19.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.19.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.2.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.2.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.2.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.20.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.20.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.20.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.21.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.21.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.21.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.22.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.22.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.22.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.23.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.23.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.23.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.24.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.24.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.24.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.25.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.25.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.25.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.26.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.26.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.26.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.27.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.27.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.27.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.28.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.28.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.28.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.29.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.29.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.29.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.3.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.3.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.3.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.30.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.30.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.30.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.31.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.31.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.31.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.32.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.32.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.32.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.33.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.33.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.33.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.34.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.34.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.34.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.35.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.35.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.35.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.36.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.36.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.36.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.37.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.37.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.37.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.38.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.38.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.38.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.39.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.39.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.39.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.4.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.4.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.4.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.40.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.40.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.40.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.41.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.41.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.41.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.42.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.42.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.42.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.43.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.43.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.43.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.44.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.44.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.44.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.45.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.45.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.45.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.46.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.46.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.46.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.47.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.47.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.47.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.48.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.48.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.48.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.49.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.49.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.49.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.5.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.5.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.5.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.50.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.50.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.50.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.51.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.51.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.51.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.52.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.52.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.52.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.53.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.53.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.53.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.54.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.54.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.54.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.55.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.55.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.55.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.56.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.56.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.56.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.57.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.57.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.57.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.58.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.58.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.58.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.59.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.59.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.59.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.6.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.6.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.6.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.60.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.60.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.60.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.61.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.61.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.61.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.62.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.62.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.62.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.63.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.63.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.63.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.64.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.64.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.64.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.65.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.65.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.65.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.66.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.66.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.66.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.67.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.67.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.67.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.68.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.68.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.68.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.69.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.69.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.69.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.7.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.7.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.7.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.70.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.70.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.70.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.71.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.71.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.71.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.72.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.72.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.72.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.73.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.73.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.73.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.74.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.74.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.74.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.75.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.75.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.75.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.76.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.76.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.76.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.77.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.77.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.77.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.78.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.78.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.78.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.79.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.79.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.79.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.8.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.8.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.8.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.80.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.80.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.80.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.81.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.81.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.81.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.82.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.82.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.82.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.83.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.83.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.83.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.84.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.84.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.84.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.85.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.85.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.85.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.86.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.86.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.86.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.87.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.87.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.87.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.88.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.88.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.88.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.89.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.89.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.89.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.9.down_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.9.gate_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.9.up_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.mlp.experts.90.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.90.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.90.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.91.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.91.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.91.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.92.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.92.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.92.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.93.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.93.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.93.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.94.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.94.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.94.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.95.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.95.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.95.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.96.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.96.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.96.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.97.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.97.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.97.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.98.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.98.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.98.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.99.down_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.99.gate_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.experts.99.up_proj.weight": "model-00119-of-00142.safetensors", + "model.layers.77.mlp.gate.e_score_correction_bias": "model-00120-of-00142.safetensors", + "model.layers.77.mlp.gate.weight": "model-00120-of-00142.safetensors", + "model.layers.77.mlp.shared_experts.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.77.mlp.shared_experts.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.77.mlp.shared_experts.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.77.post_attention_layernorm.weight": "model-00120-of-00142.safetensors", + "model.layers.77.self_attn.k_norm.weight": "model-00118-of-00142.safetensors", + "model.layers.77.self_attn.k_proj.bias": "model-00118-of-00142.safetensors", + "model.layers.77.self_attn.k_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.self_attn.o_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.self_attn.q_norm.weight": "model-00118-of-00142.safetensors", + "model.layers.77.self_attn.q_proj.bias": "model-00118-of-00142.safetensors", + "model.layers.77.self_attn.q_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.77.self_attn.v_proj.bias": "model-00118-of-00142.safetensors", + "model.layers.77.self_attn.v_proj.weight": "model-00118-of-00142.safetensors", + "model.layers.78.input_layernorm.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.0.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.0.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.0.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.1.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.1.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.1.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.10.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.10.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.10.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.100.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.100.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.100.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.101.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.101.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.101.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.102.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.102.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.102.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.103.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.103.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.103.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.104.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.104.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.104.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.105.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.105.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.105.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.106.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.106.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.106.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.107.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.107.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.107.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.108.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.108.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.108.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.109.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.109.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.109.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.11.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.11.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.11.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.110.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.110.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.110.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.111.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.111.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.111.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.112.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.112.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.112.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.113.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.113.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.113.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.114.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.114.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.114.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.115.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.115.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.115.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.116.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.116.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.116.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.117.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.117.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.117.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.118.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.118.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.118.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.119.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.119.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.119.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.12.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.12.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.12.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.120.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.120.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.120.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.121.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.121.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.121.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.122.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.122.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.122.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.123.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.123.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.123.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.124.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.124.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.124.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.125.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.125.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.125.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.126.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.126.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.126.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.127.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.127.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.127.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.128.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.128.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.128.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.129.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.129.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.129.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.13.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.13.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.13.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.130.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.130.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.130.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.131.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.131.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.131.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.132.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.132.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.132.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.133.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.133.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.133.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.134.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.134.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.134.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.135.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.135.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.135.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.136.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.136.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.136.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.137.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.137.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.137.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.138.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.138.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.138.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.139.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.139.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.139.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.14.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.14.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.14.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.140.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.140.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.140.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.141.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.141.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.141.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.142.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.142.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.142.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.143.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.143.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.143.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.144.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.144.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.144.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.145.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.145.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.145.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.146.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.146.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.146.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.147.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.147.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.147.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.148.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.148.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.148.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.149.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.149.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.149.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.15.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.15.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.15.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.150.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.150.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.150.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.151.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.151.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.151.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.152.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.152.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.152.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.153.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.153.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.153.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.154.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.154.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.154.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.155.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.155.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.155.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.156.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.156.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.156.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.157.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.157.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.157.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.158.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.158.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.158.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.159.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.159.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.159.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.16.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.16.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.16.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.17.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.17.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.17.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.18.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.18.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.18.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.19.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.19.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.19.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.2.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.2.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.2.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.20.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.20.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.20.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.21.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.21.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.21.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.22.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.22.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.22.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.23.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.23.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.23.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.24.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.24.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.24.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.25.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.25.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.25.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.26.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.26.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.26.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.27.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.27.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.27.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.28.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.28.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.28.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.29.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.29.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.29.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.3.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.3.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.3.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.30.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.30.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.30.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.31.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.31.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.31.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.32.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.32.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.32.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.33.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.33.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.33.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.34.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.34.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.34.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.35.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.35.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.35.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.36.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.36.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.36.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.37.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.37.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.37.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.38.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.38.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.38.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.39.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.39.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.39.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.4.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.4.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.4.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.40.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.40.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.40.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.41.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.41.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.41.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.42.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.42.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.42.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.43.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.43.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.43.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.44.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.44.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.44.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.45.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.45.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.45.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.46.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.46.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.46.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.47.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.47.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.47.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.48.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.48.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.48.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.49.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.49.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.49.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.5.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.5.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.5.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.50.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.50.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.50.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.51.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.51.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.51.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.52.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.52.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.52.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.53.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.53.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.53.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.54.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.54.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.54.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.55.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.55.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.55.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.56.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.56.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.56.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.57.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.57.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.57.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.58.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.58.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.58.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.59.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.59.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.59.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.6.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.6.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.6.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.60.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.60.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.60.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.61.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.61.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.61.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.62.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.62.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.62.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.63.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.63.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.63.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.64.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.64.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.64.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.65.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.65.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.65.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.66.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.66.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.66.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.67.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.67.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.67.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.68.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.68.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.68.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.69.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.69.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.69.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.7.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.7.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.7.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.70.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.70.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.70.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.71.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.71.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.71.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.72.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.72.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.72.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.73.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.73.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.73.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.74.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.74.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.74.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.75.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.75.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.75.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.76.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.76.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.76.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.77.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.77.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.77.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.78.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.78.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.78.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.79.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.79.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.79.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.8.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.8.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.8.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.80.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.80.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.80.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.81.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.81.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.81.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.82.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.82.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.82.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.83.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.83.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.83.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.84.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.84.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.84.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.85.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.85.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.85.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.86.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.86.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.86.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.87.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.87.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.87.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.88.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.88.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.88.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.89.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.89.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.89.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.9.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.9.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.9.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.90.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.90.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.90.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.91.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.91.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.91.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.92.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.92.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.92.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.93.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.93.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.93.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.94.down_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.94.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.94.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.95.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.95.gate_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.95.up_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.mlp.experts.96.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.96.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.96.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.97.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.97.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.97.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.98.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.98.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.98.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.99.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.99.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.experts.99.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.gate.e_score_correction_bias": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.gate.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.shared_experts.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.shared_experts.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.mlp.shared_experts.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.78.post_attention_layernorm.weight": "model-00121-of-00142.safetensors", + "model.layers.78.self_attn.k_norm.weight": "model-00120-of-00142.safetensors", + "model.layers.78.self_attn.k_proj.bias": "model-00120-of-00142.safetensors", + "model.layers.78.self_attn.k_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.self_attn.o_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.self_attn.q_norm.weight": "model-00120-of-00142.safetensors", + "model.layers.78.self_attn.q_proj.bias": "model-00120-of-00142.safetensors", + "model.layers.78.self_attn.q_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.78.self_attn.v_proj.bias": "model-00120-of-00142.safetensors", + "model.layers.78.self_attn.v_proj.weight": "model-00120-of-00142.safetensors", + "model.layers.79.input_layernorm.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.0.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.0.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.0.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.1.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.1.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.1.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.10.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.10.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.10.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.100.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.100.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.100.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.101.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.101.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.101.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.102.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.102.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.102.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.103.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.103.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.103.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.104.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.104.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.104.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.105.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.105.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.105.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.106.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.106.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.106.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.107.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.107.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.107.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.108.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.108.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.108.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.109.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.109.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.109.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.11.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.11.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.11.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.110.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.110.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.110.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.111.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.111.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.111.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.112.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.112.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.112.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.113.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.113.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.113.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.114.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.114.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.114.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.115.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.115.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.115.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.116.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.116.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.116.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.117.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.117.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.117.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.118.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.118.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.118.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.119.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.119.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.119.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.12.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.12.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.12.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.120.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.120.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.120.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.121.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.121.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.121.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.122.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.122.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.122.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.123.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.123.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.123.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.124.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.124.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.124.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.125.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.125.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.125.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.126.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.126.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.126.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.127.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.127.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.127.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.128.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.128.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.128.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.129.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.129.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.129.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.13.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.13.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.13.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.130.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.130.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.130.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.131.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.131.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.131.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.132.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.132.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.132.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.133.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.133.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.133.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.134.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.134.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.134.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.135.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.135.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.135.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.136.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.136.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.136.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.137.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.137.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.137.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.138.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.138.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.138.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.139.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.139.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.139.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.14.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.14.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.14.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.140.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.140.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.140.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.141.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.141.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.141.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.142.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.142.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.142.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.143.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.143.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.143.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.144.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.144.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.144.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.145.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.145.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.145.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.146.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.146.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.146.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.147.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.147.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.147.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.148.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.148.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.148.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.149.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.149.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.149.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.15.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.15.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.15.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.150.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.150.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.150.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.151.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.151.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.151.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.152.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.152.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.152.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.153.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.153.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.153.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.154.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.154.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.154.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.155.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.155.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.155.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.156.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.156.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.156.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.157.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.157.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.157.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.158.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.158.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.158.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.159.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.159.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.159.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.experts.16.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.16.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.16.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.17.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.17.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.17.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.18.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.18.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.18.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.19.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.19.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.19.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.2.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.2.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.2.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.20.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.20.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.20.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.21.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.21.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.21.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.22.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.22.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.22.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.23.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.23.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.23.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.24.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.24.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.24.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.25.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.25.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.25.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.26.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.26.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.26.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.27.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.27.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.27.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.28.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.28.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.28.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.29.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.29.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.29.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.3.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.3.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.3.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.30.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.30.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.30.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.31.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.31.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.31.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.32.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.32.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.32.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.33.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.33.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.33.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.34.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.34.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.34.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.35.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.35.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.35.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.36.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.36.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.36.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.37.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.37.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.37.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.38.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.38.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.38.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.39.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.39.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.39.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.4.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.4.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.4.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.40.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.40.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.40.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.41.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.41.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.41.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.42.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.42.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.42.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.43.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.43.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.43.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.44.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.44.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.44.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.45.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.45.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.45.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.46.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.46.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.46.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.47.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.47.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.47.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.48.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.48.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.48.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.49.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.49.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.49.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.5.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.5.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.5.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.50.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.50.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.50.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.51.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.51.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.51.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.52.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.52.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.52.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.53.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.53.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.53.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.54.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.54.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.54.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.55.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.55.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.55.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.56.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.56.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.56.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.57.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.57.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.57.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.58.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.58.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.58.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.59.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.59.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.59.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.6.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.6.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.6.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.60.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.60.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.60.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.61.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.61.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.61.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.62.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.62.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.62.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.63.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.63.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.63.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.64.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.64.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.64.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.65.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.65.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.65.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.66.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.66.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.66.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.67.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.67.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.67.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.68.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.68.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.68.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.69.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.69.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.69.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.7.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.7.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.7.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.70.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.70.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.70.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.71.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.71.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.71.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.72.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.72.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.72.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.73.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.73.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.73.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.74.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.74.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.74.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.75.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.75.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.75.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.76.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.76.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.76.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.77.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.77.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.77.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.78.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.78.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.78.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.79.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.79.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.79.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.8.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.8.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.8.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.80.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.80.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.80.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.81.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.81.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.81.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.82.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.82.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.82.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.83.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.83.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.83.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.84.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.84.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.84.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.85.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.85.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.85.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.86.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.86.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.86.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.87.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.87.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.87.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.88.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.88.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.88.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.89.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.89.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.89.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.9.down_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.9.gate_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.9.up_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.mlp.experts.90.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.90.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.90.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.91.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.91.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.91.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.92.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.92.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.92.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.93.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.93.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.93.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.94.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.94.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.94.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.95.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.95.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.95.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.96.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.96.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.96.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.97.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.97.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.97.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.98.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.98.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.98.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.99.down_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.99.gate_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.experts.99.up_proj.weight": "model-00122-of-00142.safetensors", + "model.layers.79.mlp.gate.e_score_correction_bias": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.gate.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.shared_experts.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.shared_experts.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.mlp.shared_experts.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.79.post_attention_layernorm.weight": "model-00123-of-00142.safetensors", + "model.layers.79.self_attn.k_norm.weight": "model-00121-of-00142.safetensors", + "model.layers.79.self_attn.k_proj.bias": "model-00121-of-00142.safetensors", + "model.layers.79.self_attn.k_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.self_attn.o_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.self_attn.q_norm.weight": "model-00121-of-00142.safetensors", + "model.layers.79.self_attn.q_proj.bias": "model-00121-of-00142.safetensors", + "model.layers.79.self_attn.q_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.79.self_attn.v_proj.bias": "model-00121-of-00142.safetensors", + "model.layers.79.self_attn.v_proj.weight": "model-00121-of-00142.safetensors", + "model.layers.8.input_layernorm.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.0.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.0.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.0.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.1.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.1.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.1.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.10.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.10.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.10.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.100.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.100.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.100.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.101.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.101.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.101.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.102.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.102.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.102.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.103.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.103.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.103.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.104.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.104.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.104.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.105.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.105.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.105.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.106.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.106.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.106.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.107.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.107.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.107.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.108.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.108.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.108.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.109.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.109.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.109.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.11.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.11.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.11.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.110.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.110.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.110.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.111.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.111.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.111.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.112.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.112.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.112.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.113.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.113.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.113.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.114.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.114.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.114.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.115.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.115.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.115.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.116.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.116.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.116.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.117.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.117.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.117.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.118.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.118.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.118.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.119.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.119.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.119.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.12.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.12.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.12.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.120.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.120.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.120.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.121.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.121.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.121.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.122.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.122.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.122.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.123.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.123.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.123.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.124.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.124.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.124.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.125.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.125.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.125.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.126.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.126.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.126.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.127.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.127.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.127.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.128.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.128.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.128.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.129.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.129.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.129.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.13.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.13.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.13.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.130.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.130.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.130.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.131.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.131.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.131.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.132.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.132.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.132.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.133.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.133.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.133.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.134.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.134.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.134.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.135.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.135.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.135.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.136.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.136.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.136.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.137.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.137.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.137.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.138.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.138.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.138.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.139.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.139.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.139.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.14.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.14.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.14.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.140.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.140.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.140.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.141.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.141.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.141.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.142.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.142.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.142.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.143.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.143.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.143.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.144.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.144.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.144.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.145.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.145.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.145.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.146.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.146.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.146.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.147.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.147.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.147.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.148.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.148.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.148.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.149.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.149.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.149.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.15.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.15.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.15.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.150.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.150.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.150.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.151.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.151.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.151.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.152.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.152.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.152.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.153.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.153.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.153.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.154.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.154.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.154.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.155.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.155.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.155.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.156.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.156.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.156.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.157.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.157.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.157.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.158.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.158.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.158.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.159.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.159.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.159.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.experts.16.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.16.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.16.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.17.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.17.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.17.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.18.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.18.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.18.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.19.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.19.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.19.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.2.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.2.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.2.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.20.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.20.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.20.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.21.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.21.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.21.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.22.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.22.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.22.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.23.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.23.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.23.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.24.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.24.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.24.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.25.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.25.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.25.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.26.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.26.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.26.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.27.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.27.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.27.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.28.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.28.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.28.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.29.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.29.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.29.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.3.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.3.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.3.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.30.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.30.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.30.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.31.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.31.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.31.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.32.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.32.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.32.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.33.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.33.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.33.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.34.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.34.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.34.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.35.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.35.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.35.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.36.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.36.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.36.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.37.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.37.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.37.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.38.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.38.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.38.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.39.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.39.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.39.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.4.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.4.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.4.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.40.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.40.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.40.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.41.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.41.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.41.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.42.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.42.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.42.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.43.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.43.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.43.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.44.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.44.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.44.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.45.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.45.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.45.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.46.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.46.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.46.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.47.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.47.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.47.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.48.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.48.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.48.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.49.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.49.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.49.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.5.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.5.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.5.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.50.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.50.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.50.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.51.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.51.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.51.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.52.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.52.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.52.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.53.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.53.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.53.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.54.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.54.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.54.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.55.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.55.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.55.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.56.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.56.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.56.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.57.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.57.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.57.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.58.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.58.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.58.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.59.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.59.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.59.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.6.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.6.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.6.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.60.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.60.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.60.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.61.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.61.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.61.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.62.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.62.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.62.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.63.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.63.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.63.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.64.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.64.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.64.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.65.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.65.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.65.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.66.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.66.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.66.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.67.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.67.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.67.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.68.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.68.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.68.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.69.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.69.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.69.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.7.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.7.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.7.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.70.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.70.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.70.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.71.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.71.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.71.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.72.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.72.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.72.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.73.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.73.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.73.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.74.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.74.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.74.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.75.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.75.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.75.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.76.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.76.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.76.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.77.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.77.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.77.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.78.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.78.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.78.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.79.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.79.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.79.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.8.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.8.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.8.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.80.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.80.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.80.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.81.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.81.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.81.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.82.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.82.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.82.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.83.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.83.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.83.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.84.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.84.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.84.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.85.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.85.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.85.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.86.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.86.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.86.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.87.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.87.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.87.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.88.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.88.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.88.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.89.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.89.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.89.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.9.down_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.9.gate_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.9.up_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.mlp.experts.90.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.90.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.90.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.91.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.91.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.91.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.92.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.92.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.92.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.93.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.93.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.93.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.94.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.94.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.94.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.95.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.95.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.95.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.96.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.96.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.96.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.97.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.97.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.97.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.98.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.98.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.98.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.99.down_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.99.gate_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.experts.99.up_proj.weight": "model-00010-of-00142.safetensors", + "model.layers.8.mlp.gate.e_score_correction_bias": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.gate.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.shared_experts.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.shared_experts.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.mlp.shared_experts.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00011-of-00142.safetensors", + "model.layers.8.self_attn.k_norm.weight": "model-00009-of-00142.safetensors", + "model.layers.8.self_attn.k_proj.bias": "model-00009-of-00142.safetensors", + "model.layers.8.self_attn.k_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.self_attn.q_norm.weight": "model-00009-of-00142.safetensors", + "model.layers.8.self_attn.q_proj.bias": "model-00009-of-00142.safetensors", + "model.layers.8.self_attn.q_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.8.self_attn.v_proj.bias": "model-00009-of-00142.safetensors", + "model.layers.8.self_attn.v_proj.weight": "model-00009-of-00142.safetensors", + "model.layers.80.input_layernorm.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.0.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.0.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.0.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.1.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.1.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.1.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.10.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.10.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.10.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.100.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.100.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.100.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.101.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.101.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.101.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.102.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.102.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.102.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.103.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.103.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.103.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.104.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.104.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.104.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.105.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.105.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.105.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.106.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.106.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.106.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.107.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.107.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.107.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.108.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.108.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.108.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.109.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.109.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.109.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.11.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.11.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.11.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.110.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.110.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.110.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.111.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.111.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.111.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.112.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.112.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.112.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.113.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.113.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.113.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.114.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.114.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.114.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.115.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.115.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.115.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.116.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.116.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.116.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.117.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.117.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.117.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.118.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.118.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.118.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.119.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.119.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.119.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.12.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.12.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.12.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.120.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.120.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.120.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.121.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.121.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.121.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.122.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.122.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.122.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.123.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.123.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.123.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.124.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.124.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.124.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.125.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.125.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.125.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.126.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.126.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.126.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.127.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.127.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.127.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.128.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.128.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.128.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.129.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.129.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.129.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.13.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.13.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.13.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.130.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.130.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.130.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.131.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.131.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.131.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.132.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.132.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.132.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.133.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.133.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.133.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.134.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.134.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.134.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.135.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.135.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.135.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.136.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.136.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.136.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.137.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.137.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.137.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.138.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.138.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.138.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.139.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.139.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.139.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.14.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.14.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.14.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.140.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.140.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.140.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.141.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.141.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.141.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.142.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.142.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.142.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.143.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.143.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.143.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.144.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.144.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.144.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.145.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.145.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.145.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.146.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.146.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.146.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.147.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.147.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.147.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.148.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.148.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.148.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.149.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.149.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.149.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.15.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.15.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.15.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.150.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.150.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.150.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.151.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.151.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.151.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.152.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.152.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.152.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.153.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.153.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.153.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.154.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.154.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.154.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.155.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.155.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.155.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.156.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.156.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.156.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.157.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.157.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.157.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.158.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.158.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.158.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.159.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.159.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.159.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.16.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.16.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.16.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.17.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.17.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.17.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.18.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.18.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.18.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.19.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.19.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.19.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.2.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.2.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.2.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.20.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.20.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.20.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.21.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.21.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.21.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.22.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.22.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.22.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.23.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.23.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.23.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.24.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.24.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.24.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.25.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.25.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.25.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.26.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.26.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.26.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.27.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.27.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.27.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.28.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.28.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.28.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.29.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.29.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.29.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.3.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.3.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.3.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.30.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.30.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.30.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.31.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.31.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.31.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.32.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.32.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.32.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.33.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.33.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.33.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.34.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.34.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.34.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.35.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.35.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.35.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.36.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.36.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.36.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.37.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.37.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.37.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.38.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.38.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.38.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.39.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.39.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.39.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.4.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.4.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.4.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.40.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.40.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.40.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.41.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.41.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.41.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.42.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.42.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.42.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.43.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.43.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.43.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.44.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.44.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.44.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.45.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.45.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.45.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.46.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.46.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.46.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.47.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.47.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.47.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.48.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.48.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.48.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.49.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.49.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.49.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.5.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.5.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.5.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.50.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.50.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.50.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.51.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.51.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.51.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.52.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.52.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.52.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.53.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.53.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.53.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.54.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.54.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.54.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.55.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.55.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.55.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.56.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.56.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.56.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.57.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.57.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.57.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.58.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.58.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.58.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.59.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.59.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.59.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.6.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.6.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.6.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.60.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.60.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.60.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.61.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.61.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.61.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.62.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.62.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.62.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.63.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.63.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.63.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.64.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.64.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.64.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.65.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.65.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.65.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.66.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.66.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.66.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.67.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.67.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.67.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.68.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.68.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.68.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.69.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.69.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.69.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.7.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.7.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.7.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.70.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.70.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.70.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.71.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.71.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.71.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.72.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.72.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.72.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.73.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.73.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.73.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.74.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.74.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.74.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.75.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.75.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.75.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.76.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.76.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.76.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.77.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.77.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.77.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.78.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.78.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.78.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.79.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.79.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.79.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.8.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.8.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.8.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.80.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.80.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.80.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.81.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.81.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.81.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.82.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.82.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.82.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.83.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.83.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.83.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.84.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.84.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.84.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.85.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.85.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.85.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.86.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.86.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.86.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.87.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.87.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.87.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.88.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.88.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.88.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.89.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.89.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.89.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.9.down_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.9.gate_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.9.up_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.mlp.experts.90.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.90.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.90.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.91.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.91.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.91.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.92.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.92.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.92.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.93.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.93.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.93.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.94.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.94.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.94.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.95.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.95.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.95.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.96.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.96.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.96.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.97.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.97.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.97.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.98.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.98.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.98.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.99.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.99.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.experts.99.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.gate.e_score_correction_bias": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.gate.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.shared_experts.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.shared_experts.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.mlp.shared_experts.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.80.post_attention_layernorm.weight": "model-00124-of-00142.safetensors", + "model.layers.80.self_attn.k_norm.weight": "model-00123-of-00142.safetensors", + "model.layers.80.self_attn.k_proj.bias": "model-00123-of-00142.safetensors", + "model.layers.80.self_attn.k_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.self_attn.o_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.self_attn.q_norm.weight": "model-00123-of-00142.safetensors", + "model.layers.80.self_attn.q_proj.bias": "model-00123-of-00142.safetensors", + "model.layers.80.self_attn.q_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.80.self_attn.v_proj.bias": "model-00123-of-00142.safetensors", + "model.layers.80.self_attn.v_proj.weight": "model-00123-of-00142.safetensors", + "model.layers.81.input_layernorm.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.0.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.0.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.0.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.1.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.1.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.1.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.10.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.10.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.10.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.100.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.100.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.100.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.101.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.101.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.101.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.102.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.102.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.102.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.103.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.103.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.103.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.104.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.104.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.104.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.105.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.105.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.105.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.106.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.106.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.106.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.107.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.107.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.107.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.108.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.108.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.108.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.109.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.109.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.109.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.11.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.11.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.11.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.110.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.110.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.110.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.111.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.111.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.111.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.112.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.112.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.112.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.113.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.113.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.113.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.114.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.114.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.114.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.115.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.115.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.115.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.116.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.116.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.116.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.117.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.117.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.117.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.118.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.118.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.118.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.119.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.119.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.119.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.12.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.12.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.12.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.120.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.120.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.120.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.121.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.121.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.121.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.122.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.122.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.122.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.123.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.123.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.123.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.124.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.124.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.124.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.125.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.125.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.125.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.126.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.126.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.126.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.127.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.127.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.127.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.128.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.128.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.128.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.129.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.129.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.129.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.13.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.13.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.13.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.130.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.130.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.130.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.131.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.131.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.131.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.132.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.132.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.132.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.133.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.133.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.133.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.134.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.134.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.134.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.135.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.135.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.135.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.136.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.136.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.136.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.137.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.137.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.137.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.138.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.138.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.138.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.139.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.139.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.139.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.14.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.14.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.14.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.140.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.140.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.140.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.141.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.141.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.141.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.142.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.142.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.142.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.143.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.143.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.143.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.144.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.144.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.144.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.145.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.145.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.145.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.146.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.146.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.146.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.147.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.147.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.147.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.148.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.148.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.148.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.149.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.149.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.149.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.15.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.15.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.15.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.150.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.150.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.150.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.151.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.151.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.151.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.152.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.152.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.152.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.153.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.153.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.153.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.154.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.154.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.154.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.155.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.155.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.155.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.156.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.156.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.156.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.157.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.157.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.157.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.158.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.158.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.158.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.159.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.159.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.159.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.experts.16.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.16.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.16.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.17.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.17.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.17.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.18.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.18.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.18.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.19.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.19.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.19.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.2.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.2.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.2.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.20.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.20.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.20.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.21.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.21.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.21.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.22.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.22.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.22.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.23.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.23.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.23.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.24.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.24.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.24.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.25.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.25.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.25.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.26.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.26.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.26.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.27.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.27.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.27.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.28.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.28.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.28.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.29.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.29.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.29.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.3.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.3.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.3.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.30.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.30.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.30.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.31.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.31.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.31.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.32.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.32.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.32.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.33.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.33.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.33.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.34.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.34.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.34.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.35.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.35.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.35.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.36.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.36.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.36.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.37.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.37.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.37.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.38.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.38.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.38.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.39.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.39.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.39.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.4.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.4.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.4.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.40.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.40.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.40.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.41.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.41.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.41.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.42.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.42.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.42.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.43.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.43.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.43.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.44.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.44.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.44.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.45.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.45.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.45.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.46.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.46.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.46.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.47.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.47.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.47.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.48.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.48.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.48.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.49.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.49.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.49.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.5.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.5.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.5.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.50.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.50.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.50.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.51.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.51.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.51.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.52.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.52.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.52.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.53.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.53.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.53.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.54.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.54.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.54.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.55.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.55.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.55.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.56.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.56.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.56.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.57.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.57.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.57.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.58.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.58.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.58.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.59.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.59.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.59.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.6.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.6.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.6.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.60.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.60.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.60.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.61.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.61.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.61.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.62.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.62.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.62.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.63.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.63.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.63.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.64.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.64.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.64.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.65.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.65.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.65.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.66.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.66.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.66.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.67.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.67.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.67.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.68.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.68.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.68.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.69.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.69.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.69.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.7.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.7.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.7.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.70.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.70.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.70.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.71.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.71.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.71.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.72.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.72.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.72.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.73.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.73.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.73.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.74.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.74.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.74.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.75.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.75.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.75.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.76.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.76.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.76.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.77.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.77.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.77.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.78.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.78.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.78.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.79.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.79.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.79.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.8.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.8.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.8.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.80.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.80.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.80.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.81.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.81.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.81.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.82.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.82.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.82.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.83.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.83.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.83.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.84.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.84.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.84.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.85.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.85.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.85.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.86.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.86.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.86.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.87.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.87.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.87.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.88.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.88.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.88.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.89.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.89.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.89.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.9.down_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.9.gate_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.9.up_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.mlp.experts.90.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.90.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.90.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.91.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.91.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.91.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.92.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.92.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.92.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.93.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.93.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.93.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.94.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.94.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.94.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.95.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.95.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.95.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.96.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.96.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.96.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.97.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.97.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.97.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.98.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.98.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.98.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.99.down_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.99.gate_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.experts.99.up_proj.weight": "model-00125-of-00142.safetensors", + "model.layers.81.mlp.gate.e_score_correction_bias": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.gate.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.shared_experts.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.shared_experts.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.mlp.shared_experts.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.81.post_attention_layernorm.weight": "model-00126-of-00142.safetensors", + "model.layers.81.self_attn.k_norm.weight": "model-00124-of-00142.safetensors", + "model.layers.81.self_attn.k_proj.bias": "model-00124-of-00142.safetensors", + "model.layers.81.self_attn.k_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.self_attn.o_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.self_attn.q_norm.weight": "model-00124-of-00142.safetensors", + "model.layers.81.self_attn.q_proj.bias": "model-00124-of-00142.safetensors", + "model.layers.81.self_attn.q_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.81.self_attn.v_proj.bias": "model-00124-of-00142.safetensors", + "model.layers.81.self_attn.v_proj.weight": "model-00124-of-00142.safetensors", + "model.layers.82.input_layernorm.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.0.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.0.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.0.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.1.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.1.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.1.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.10.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.10.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.10.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.100.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.100.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.100.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.101.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.101.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.101.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.102.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.102.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.102.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.103.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.103.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.103.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.104.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.104.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.104.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.105.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.105.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.105.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.106.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.106.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.106.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.107.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.107.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.107.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.108.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.108.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.108.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.109.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.109.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.109.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.11.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.11.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.11.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.110.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.110.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.110.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.111.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.111.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.111.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.112.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.112.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.112.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.113.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.113.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.113.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.114.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.114.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.114.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.115.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.115.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.115.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.116.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.116.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.116.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.117.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.117.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.117.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.118.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.118.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.118.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.119.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.119.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.119.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.12.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.12.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.12.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.120.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.120.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.120.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.121.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.121.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.121.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.122.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.122.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.122.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.123.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.123.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.123.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.124.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.124.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.124.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.125.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.125.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.125.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.126.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.126.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.126.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.127.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.127.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.127.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.128.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.128.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.128.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.129.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.129.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.129.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.13.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.13.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.13.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.130.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.130.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.130.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.131.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.131.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.131.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.132.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.132.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.132.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.133.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.133.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.133.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.134.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.134.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.134.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.135.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.135.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.135.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.136.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.136.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.136.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.137.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.137.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.137.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.138.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.138.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.138.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.139.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.139.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.139.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.14.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.14.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.14.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.140.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.140.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.140.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.141.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.141.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.141.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.142.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.142.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.142.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.143.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.143.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.143.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.144.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.144.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.144.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.145.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.145.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.145.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.146.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.146.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.146.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.147.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.147.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.147.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.148.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.148.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.148.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.149.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.149.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.149.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.15.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.15.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.15.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.150.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.150.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.150.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.151.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.151.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.151.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.152.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.152.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.152.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.153.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.153.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.153.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.154.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.154.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.154.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.155.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.155.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.155.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.156.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.156.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.156.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.157.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.157.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.157.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.158.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.158.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.158.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.159.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.159.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.159.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.16.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.16.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.16.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.17.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.17.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.17.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.18.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.18.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.18.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.19.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.19.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.19.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.2.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.2.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.2.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.20.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.20.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.20.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.21.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.21.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.21.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.22.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.22.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.22.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.23.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.23.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.23.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.24.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.24.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.24.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.25.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.25.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.25.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.26.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.26.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.26.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.27.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.27.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.27.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.28.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.28.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.28.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.29.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.29.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.29.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.3.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.3.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.3.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.30.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.30.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.30.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.31.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.31.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.31.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.32.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.32.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.32.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.33.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.33.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.33.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.34.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.34.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.34.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.35.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.35.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.35.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.36.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.36.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.36.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.37.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.37.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.37.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.38.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.38.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.38.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.39.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.39.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.39.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.4.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.4.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.4.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.40.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.40.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.40.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.41.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.41.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.41.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.42.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.42.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.42.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.43.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.43.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.43.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.44.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.44.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.44.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.45.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.45.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.45.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.46.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.46.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.46.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.47.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.47.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.47.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.48.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.48.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.48.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.49.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.49.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.49.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.5.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.5.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.5.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.50.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.50.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.50.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.51.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.51.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.51.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.52.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.52.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.52.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.53.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.53.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.53.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.54.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.54.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.54.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.55.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.55.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.55.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.56.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.56.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.56.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.57.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.57.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.57.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.58.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.58.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.58.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.59.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.59.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.59.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.6.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.6.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.6.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.60.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.60.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.60.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.61.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.61.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.61.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.62.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.62.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.62.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.63.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.63.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.63.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.64.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.64.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.64.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.65.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.65.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.65.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.66.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.66.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.66.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.67.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.67.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.67.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.68.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.68.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.68.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.69.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.69.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.69.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.7.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.7.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.7.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.70.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.70.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.70.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.71.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.71.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.71.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.72.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.72.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.72.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.73.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.73.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.73.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.74.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.74.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.74.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.75.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.75.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.75.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.76.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.76.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.76.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.77.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.77.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.77.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.78.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.78.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.78.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.79.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.79.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.79.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.8.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.8.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.8.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.80.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.80.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.80.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.81.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.81.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.81.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.82.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.82.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.82.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.83.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.83.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.83.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.84.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.84.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.84.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.85.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.85.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.85.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.86.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.86.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.86.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.87.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.87.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.87.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.88.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.88.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.88.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.89.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.89.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.89.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.9.down_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.9.gate_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.9.up_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.mlp.experts.90.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.90.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.90.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.91.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.91.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.91.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.92.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.92.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.92.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.93.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.93.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.93.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.94.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.94.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.94.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.95.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.95.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.95.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.96.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.96.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.96.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.97.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.97.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.97.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.98.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.98.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.98.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.99.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.99.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.experts.99.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.gate.e_score_correction_bias": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.gate.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.shared_experts.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.shared_experts.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.mlp.shared_experts.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.82.post_attention_layernorm.weight": "model-00127-of-00142.safetensors", + "model.layers.82.self_attn.k_norm.weight": "model-00126-of-00142.safetensors", + "model.layers.82.self_attn.k_proj.bias": "model-00126-of-00142.safetensors", + "model.layers.82.self_attn.k_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.self_attn.o_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.self_attn.q_norm.weight": "model-00126-of-00142.safetensors", + "model.layers.82.self_attn.q_proj.bias": "model-00126-of-00142.safetensors", + "model.layers.82.self_attn.q_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.82.self_attn.v_proj.bias": "model-00126-of-00142.safetensors", + "model.layers.82.self_attn.v_proj.weight": "model-00126-of-00142.safetensors", + "model.layers.83.input_layernorm.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.0.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.83.mlp.experts.0.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.83.mlp.experts.0.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.83.mlp.experts.1.down_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.83.mlp.experts.1.gate_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.83.mlp.experts.1.up_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.83.mlp.experts.10.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.10.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.10.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.100.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.100.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.100.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.101.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.101.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.101.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.102.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.102.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.102.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.103.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.103.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.103.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.104.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.104.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.104.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.105.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.105.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.105.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.106.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.106.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.106.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.107.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.107.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.107.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.108.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.108.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.108.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.109.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.109.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.109.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.11.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.11.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.11.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.110.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.110.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.110.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.111.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.111.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.111.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.112.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.112.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.112.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.113.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.113.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.113.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.114.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.114.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.114.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.115.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.115.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.115.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.116.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.116.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.116.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.117.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.117.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.117.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.118.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.118.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.118.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.119.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.119.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.119.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.12.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.12.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.12.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.120.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.120.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.120.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.121.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.121.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.121.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.122.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.122.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.122.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.123.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.123.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.123.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.124.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.124.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.124.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.125.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.125.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.125.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.126.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.126.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.126.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.127.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.127.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.127.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.128.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.128.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.128.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.129.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.129.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.129.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.13.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.13.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.13.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.130.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.130.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.130.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.131.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.131.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.131.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.132.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.132.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.132.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.133.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.133.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.133.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.134.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.134.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.134.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.135.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.135.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.135.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.136.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.136.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.136.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.137.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.137.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.137.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.138.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.138.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.138.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.139.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.139.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.139.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.14.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.14.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.14.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.140.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.140.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.140.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.141.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.141.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.141.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.142.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.142.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.142.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.143.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.143.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.143.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.144.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.144.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.144.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.145.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.145.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.145.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.146.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.146.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.146.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.147.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.147.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.147.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.148.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.148.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.148.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.149.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.149.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.149.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.15.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.15.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.15.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.150.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.150.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.150.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.151.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.151.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.151.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.152.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.152.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.152.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.153.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.153.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.153.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.154.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.154.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.154.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.155.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.155.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.155.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.156.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.156.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.156.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.157.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.157.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.157.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.158.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.158.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.158.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.159.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.159.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.159.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.experts.16.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.16.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.16.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.17.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.17.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.17.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.18.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.18.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.18.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.19.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.19.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.19.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.2.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.2.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.2.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.20.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.20.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.20.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.21.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.21.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.21.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.22.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.22.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.22.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.23.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.23.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.23.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.24.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.24.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.24.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.25.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.25.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.25.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.26.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.26.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.26.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.27.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.27.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.27.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.28.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.28.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.28.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.29.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.29.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.29.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.3.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.3.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.3.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.30.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.30.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.30.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.31.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.31.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.31.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.32.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.32.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.32.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.33.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.33.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.33.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.34.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.34.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.34.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.35.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.35.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.35.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.36.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.36.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.36.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.37.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.37.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.37.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.38.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.38.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.38.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.39.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.39.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.39.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.4.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.4.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.4.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.40.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.40.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.40.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.41.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.41.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.41.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.42.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.42.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.42.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.43.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.43.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.43.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.44.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.44.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.44.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.45.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.45.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.45.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.46.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.46.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.46.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.47.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.47.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.47.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.48.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.48.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.48.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.49.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.49.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.49.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.5.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.5.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.5.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.50.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.50.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.50.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.51.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.51.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.51.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.52.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.52.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.52.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.53.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.53.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.53.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.54.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.54.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.54.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.55.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.55.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.55.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.56.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.56.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.56.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.57.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.57.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.57.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.58.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.58.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.58.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.59.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.59.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.59.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.6.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.6.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.6.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.60.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.60.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.60.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.61.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.61.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.61.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.62.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.62.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.62.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.63.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.63.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.63.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.64.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.64.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.64.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.65.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.65.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.65.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.66.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.66.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.66.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.67.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.67.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.67.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.68.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.68.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.68.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.69.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.69.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.69.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.7.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.7.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.7.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.70.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.70.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.70.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.71.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.71.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.71.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.72.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.72.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.72.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.73.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.73.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.73.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.74.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.74.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.74.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.75.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.75.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.75.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.76.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.76.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.76.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.77.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.77.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.77.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.78.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.78.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.78.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.79.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.79.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.79.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.8.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.8.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.8.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.80.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.80.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.80.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.81.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.81.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.81.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.82.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.82.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.82.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.83.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.83.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.83.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.84.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.84.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.84.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.85.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.85.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.85.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.86.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.86.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.86.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.87.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.87.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.87.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.88.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.88.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.88.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.89.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.89.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.89.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.9.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.9.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.9.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.90.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.90.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.90.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.91.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.91.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.91.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.92.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.92.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.92.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.93.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.93.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.93.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.94.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.94.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.94.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.95.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.95.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.95.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.96.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.96.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.96.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.97.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.97.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.97.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.98.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.98.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.98.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.99.down_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.99.gate_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.experts.99.up_proj.weight": "model-00128-of-00142.safetensors", + "model.layers.83.mlp.gate.e_score_correction_bias": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.gate.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.shared_experts.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.shared_experts.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.mlp.shared_experts.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.83.post_attention_layernorm.weight": "model-00129-of-00142.safetensors", + "model.layers.83.self_attn.k_norm.weight": "model-00127-of-00142.safetensors", + "model.layers.83.self_attn.k_proj.bias": "model-00127-of-00142.safetensors", + "model.layers.83.self_attn.k_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.83.self_attn.o_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.83.self_attn.q_norm.weight": "model-00127-of-00142.safetensors", + "model.layers.83.self_attn.q_proj.bias": "model-00127-of-00142.safetensors", + "model.layers.83.self_attn.q_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.83.self_attn.v_proj.bias": "model-00127-of-00142.safetensors", + "model.layers.83.self_attn.v_proj.weight": "model-00127-of-00142.safetensors", + "model.layers.84.input_layernorm.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.0.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.0.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.0.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.1.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.1.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.1.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.10.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.10.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.10.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.100.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.100.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.100.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.101.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.101.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.101.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.102.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.102.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.102.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.103.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.103.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.103.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.104.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.104.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.104.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.105.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.105.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.105.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.106.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.106.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.106.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.107.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.107.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.107.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.108.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.108.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.108.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.109.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.109.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.109.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.11.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.11.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.11.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.110.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.110.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.110.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.111.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.111.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.111.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.112.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.112.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.112.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.113.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.113.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.113.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.114.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.114.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.114.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.115.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.115.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.115.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.116.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.116.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.116.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.117.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.117.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.117.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.118.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.118.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.118.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.119.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.119.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.119.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.12.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.12.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.12.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.120.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.120.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.120.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.121.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.121.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.121.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.122.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.122.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.122.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.123.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.123.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.123.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.124.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.124.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.124.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.125.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.125.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.125.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.126.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.126.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.126.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.127.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.127.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.127.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.128.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.128.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.128.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.129.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.129.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.129.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.13.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.13.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.13.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.130.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.130.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.130.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.131.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.131.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.131.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.132.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.132.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.132.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.133.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.133.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.133.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.134.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.134.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.134.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.135.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.135.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.135.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.136.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.136.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.136.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.137.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.137.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.137.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.138.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.138.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.138.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.139.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.139.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.139.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.14.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.14.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.14.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.140.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.140.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.140.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.141.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.141.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.141.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.142.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.142.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.142.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.143.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.143.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.143.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.144.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.144.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.144.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.145.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.145.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.145.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.146.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.146.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.146.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.147.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.147.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.147.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.148.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.148.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.148.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.149.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.149.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.149.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.15.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.15.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.15.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.150.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.150.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.150.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.151.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.151.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.151.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.152.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.152.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.152.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.153.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.153.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.153.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.154.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.154.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.154.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.155.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.155.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.155.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.156.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.156.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.156.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.157.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.157.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.157.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.158.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.158.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.158.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.159.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.159.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.159.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.experts.16.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.16.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.16.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.17.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.17.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.17.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.18.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.18.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.18.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.19.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.19.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.19.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.2.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.2.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.2.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.20.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.20.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.20.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.21.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.21.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.21.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.22.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.22.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.22.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.23.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.23.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.23.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.24.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.24.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.24.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.25.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.25.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.25.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.26.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.26.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.26.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.27.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.27.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.27.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.28.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.28.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.28.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.29.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.29.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.29.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.3.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.3.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.3.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.30.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.30.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.30.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.31.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.31.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.31.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.32.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.32.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.32.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.33.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.33.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.33.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.34.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.34.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.34.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.35.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.35.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.35.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.36.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.36.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.36.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.37.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.37.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.37.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.38.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.38.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.38.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.39.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.39.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.39.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.4.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.4.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.4.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.40.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.40.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.40.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.41.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.41.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.41.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.42.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.42.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.42.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.43.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.43.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.43.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.44.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.44.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.44.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.45.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.45.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.45.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.46.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.46.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.46.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.47.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.47.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.47.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.48.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.48.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.48.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.49.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.49.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.49.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.5.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.5.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.5.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.50.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.50.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.50.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.51.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.51.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.51.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.52.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.52.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.52.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.53.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.53.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.53.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.54.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.54.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.54.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.55.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.55.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.55.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.56.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.56.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.56.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.57.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.57.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.57.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.58.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.58.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.58.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.59.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.59.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.59.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.6.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.6.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.6.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.60.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.60.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.60.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.61.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.61.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.61.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.62.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.62.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.62.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.63.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.63.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.63.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.64.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.64.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.64.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.65.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.65.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.65.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.66.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.66.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.66.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.67.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.67.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.67.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.68.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.68.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.68.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.69.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.69.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.69.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.7.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.7.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.7.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.70.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.70.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.70.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.71.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.71.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.71.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.72.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.72.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.72.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.73.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.73.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.73.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.74.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.74.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.74.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.75.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.75.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.75.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.76.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.76.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.76.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.77.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.77.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.77.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.78.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.78.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.78.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.79.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.79.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.79.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.8.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.8.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.8.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.80.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.80.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.80.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.81.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.81.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.81.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.82.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.82.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.82.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.83.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.83.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.83.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.84.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.84.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.84.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.85.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.85.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.85.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.86.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.86.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.86.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.87.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.87.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.87.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.88.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.88.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.88.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.89.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.89.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.89.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.9.down_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.9.gate_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.9.up_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.mlp.experts.90.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.90.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.90.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.91.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.91.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.91.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.92.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.92.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.92.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.93.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.93.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.93.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.94.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.94.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.94.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.95.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.95.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.95.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.96.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.96.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.96.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.97.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.97.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.97.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.98.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.98.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.98.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.99.down_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.99.gate_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.experts.99.up_proj.weight": "model-00130-of-00142.safetensors", + "model.layers.84.mlp.gate.e_score_correction_bias": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.gate.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.shared_experts.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.shared_experts.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.mlp.shared_experts.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.84.post_attention_layernorm.weight": "model-00131-of-00142.safetensors", + "model.layers.84.self_attn.k_norm.weight": "model-00129-of-00142.safetensors", + "model.layers.84.self_attn.k_proj.bias": "model-00129-of-00142.safetensors", + "model.layers.84.self_attn.k_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.self_attn.o_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.self_attn.q_norm.weight": "model-00129-of-00142.safetensors", + "model.layers.84.self_attn.q_proj.bias": "model-00129-of-00142.safetensors", + "model.layers.84.self_attn.q_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.84.self_attn.v_proj.bias": "model-00129-of-00142.safetensors", + "model.layers.84.self_attn.v_proj.weight": "model-00129-of-00142.safetensors", + "model.layers.85.input_layernorm.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.0.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.0.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.0.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.1.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.1.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.1.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.10.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.10.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.10.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.100.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.100.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.100.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.101.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.101.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.101.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.102.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.102.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.102.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.103.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.103.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.103.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.104.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.104.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.104.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.105.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.105.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.105.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.106.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.106.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.106.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.107.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.107.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.107.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.108.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.108.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.108.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.109.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.109.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.109.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.11.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.11.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.11.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.110.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.110.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.110.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.111.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.111.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.111.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.112.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.112.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.112.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.113.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.113.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.113.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.114.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.114.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.114.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.115.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.115.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.115.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.116.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.116.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.116.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.117.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.117.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.117.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.118.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.118.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.118.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.119.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.119.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.119.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.12.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.12.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.12.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.120.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.120.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.120.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.121.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.121.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.121.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.122.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.122.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.122.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.123.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.123.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.123.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.124.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.124.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.124.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.125.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.125.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.125.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.126.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.126.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.126.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.127.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.127.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.127.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.128.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.128.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.128.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.129.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.129.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.129.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.13.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.13.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.13.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.130.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.130.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.130.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.131.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.131.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.131.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.132.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.132.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.132.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.133.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.133.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.133.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.134.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.134.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.134.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.135.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.135.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.135.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.136.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.136.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.136.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.137.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.137.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.137.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.138.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.138.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.138.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.139.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.139.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.139.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.14.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.14.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.14.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.140.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.140.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.140.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.141.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.141.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.141.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.142.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.142.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.142.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.143.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.143.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.143.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.144.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.144.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.144.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.145.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.145.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.145.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.146.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.146.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.146.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.147.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.147.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.147.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.148.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.148.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.148.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.149.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.149.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.149.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.15.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.15.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.15.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.150.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.150.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.150.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.151.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.151.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.151.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.152.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.152.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.152.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.153.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.153.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.153.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.154.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.154.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.154.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.155.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.155.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.155.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.156.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.156.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.156.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.157.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.157.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.157.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.158.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.158.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.158.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.159.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.159.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.159.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.16.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.16.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.16.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.17.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.17.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.17.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.18.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.18.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.18.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.19.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.19.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.19.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.2.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.2.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.2.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.20.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.20.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.20.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.21.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.21.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.21.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.22.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.22.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.22.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.23.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.23.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.23.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.24.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.24.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.24.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.25.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.25.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.25.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.26.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.26.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.26.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.27.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.27.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.27.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.28.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.28.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.28.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.29.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.29.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.29.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.3.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.3.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.3.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.30.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.30.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.30.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.31.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.31.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.31.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.32.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.32.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.32.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.33.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.33.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.33.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.34.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.34.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.34.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.35.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.35.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.35.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.36.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.36.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.36.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.37.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.37.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.37.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.38.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.38.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.38.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.39.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.39.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.39.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.4.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.4.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.4.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.40.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.40.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.40.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.41.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.41.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.41.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.42.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.42.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.42.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.43.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.43.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.43.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.44.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.44.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.44.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.45.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.45.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.45.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.46.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.46.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.46.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.47.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.47.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.47.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.48.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.48.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.48.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.49.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.49.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.49.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.5.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.5.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.5.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.50.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.50.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.50.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.51.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.51.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.51.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.52.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.52.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.52.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.53.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.53.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.53.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.54.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.54.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.54.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.55.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.55.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.55.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.56.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.56.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.56.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.57.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.57.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.57.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.58.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.58.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.58.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.59.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.59.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.59.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.6.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.6.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.6.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.60.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.60.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.60.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.61.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.61.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.61.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.62.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.62.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.62.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.63.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.63.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.63.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.64.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.64.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.64.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.65.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.65.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.65.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.66.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.66.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.66.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.67.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.67.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.67.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.68.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.68.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.68.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.69.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.69.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.69.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.7.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.7.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.7.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.70.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.70.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.70.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.71.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.71.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.71.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.72.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.72.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.72.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.73.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.73.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.73.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.74.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.74.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.74.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.75.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.75.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.75.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.76.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.76.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.76.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.77.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.77.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.77.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.78.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.78.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.78.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.79.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.79.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.79.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.8.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.8.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.8.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.80.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.80.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.80.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.81.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.81.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.81.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.82.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.82.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.82.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.83.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.83.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.83.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.84.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.84.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.84.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.85.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.85.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.85.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.86.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.86.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.86.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.87.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.87.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.87.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.88.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.88.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.88.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.89.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.89.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.89.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.9.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.9.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.9.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.90.down_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.90.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.90.up_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.91.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.91.gate_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.mlp.experts.91.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.92.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.92.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.92.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.93.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.93.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.93.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.94.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.94.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.94.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.95.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.95.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.95.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.96.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.96.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.96.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.97.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.97.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.97.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.98.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.98.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.98.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.99.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.99.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.experts.99.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.gate.e_score_correction_bias": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.gate.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.shared_experts.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.shared_experts.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.mlp.shared_experts.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.85.post_attention_layernorm.weight": "model-00132-of-00142.safetensors", + "model.layers.85.self_attn.k_norm.weight": "model-00131-of-00142.safetensors", + "model.layers.85.self_attn.k_proj.bias": "model-00131-of-00142.safetensors", + "model.layers.85.self_attn.k_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.self_attn.o_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.self_attn.q_norm.weight": "model-00131-of-00142.safetensors", + "model.layers.85.self_attn.q_proj.bias": "model-00131-of-00142.safetensors", + "model.layers.85.self_attn.q_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.85.self_attn.v_proj.bias": "model-00131-of-00142.safetensors", + "model.layers.85.self_attn.v_proj.weight": "model-00131-of-00142.safetensors", + "model.layers.86.input_layernorm.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.0.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.0.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.0.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.1.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.1.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.1.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.10.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.10.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.10.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.100.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.100.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.100.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.101.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.101.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.101.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.102.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.102.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.102.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.103.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.103.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.103.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.104.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.104.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.104.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.105.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.105.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.105.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.106.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.106.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.106.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.107.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.107.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.107.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.108.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.108.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.108.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.109.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.109.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.109.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.11.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.11.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.11.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.110.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.110.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.110.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.111.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.111.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.111.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.112.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.112.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.112.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.113.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.113.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.113.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.114.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.114.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.114.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.115.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.115.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.115.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.116.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.116.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.116.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.117.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.117.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.117.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.118.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.118.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.118.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.119.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.119.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.119.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.12.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.12.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.12.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.120.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.120.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.120.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.121.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.121.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.121.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.122.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.122.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.122.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.123.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.123.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.123.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.124.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.124.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.124.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.125.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.125.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.125.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.126.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.126.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.126.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.127.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.127.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.127.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.128.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.128.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.128.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.129.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.129.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.129.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.13.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.13.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.13.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.130.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.130.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.130.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.131.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.131.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.131.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.132.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.132.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.132.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.133.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.133.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.133.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.134.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.134.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.134.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.135.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.135.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.135.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.136.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.136.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.136.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.137.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.137.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.137.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.138.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.138.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.138.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.139.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.139.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.139.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.14.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.14.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.14.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.140.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.140.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.140.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.141.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.141.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.141.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.142.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.142.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.142.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.143.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.143.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.143.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.144.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.144.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.144.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.145.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.145.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.145.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.146.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.146.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.146.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.147.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.147.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.147.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.148.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.148.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.148.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.149.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.149.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.149.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.15.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.15.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.15.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.150.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.150.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.150.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.151.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.151.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.151.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.152.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.152.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.152.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.153.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.153.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.153.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.154.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.154.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.154.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.155.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.155.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.155.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.156.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.156.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.156.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.157.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.157.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.157.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.158.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.158.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.158.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.159.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.159.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.159.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.experts.16.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.16.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.16.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.17.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.17.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.17.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.18.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.18.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.18.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.19.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.19.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.19.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.2.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.2.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.2.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.20.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.20.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.20.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.21.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.21.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.21.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.22.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.22.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.22.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.23.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.23.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.23.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.24.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.24.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.24.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.25.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.25.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.25.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.26.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.26.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.26.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.27.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.27.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.27.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.28.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.28.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.28.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.29.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.29.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.29.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.3.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.3.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.3.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.30.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.30.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.30.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.31.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.31.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.31.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.32.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.32.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.32.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.33.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.33.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.33.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.34.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.34.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.34.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.35.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.35.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.35.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.36.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.36.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.36.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.37.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.37.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.37.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.38.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.38.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.38.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.39.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.39.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.39.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.4.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.4.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.4.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.40.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.40.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.40.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.41.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.41.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.41.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.42.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.42.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.42.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.43.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.43.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.43.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.44.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.44.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.44.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.45.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.45.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.45.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.46.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.46.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.46.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.47.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.47.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.47.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.48.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.48.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.48.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.49.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.49.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.49.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.5.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.5.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.5.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.50.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.50.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.50.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.51.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.51.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.51.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.52.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.52.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.52.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.53.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.53.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.53.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.54.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.54.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.54.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.55.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.55.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.55.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.56.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.56.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.56.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.57.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.57.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.57.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.58.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.58.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.58.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.59.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.59.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.59.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.6.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.6.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.6.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.60.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.60.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.60.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.61.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.61.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.61.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.62.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.62.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.62.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.63.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.63.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.63.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.64.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.64.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.64.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.65.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.65.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.65.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.66.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.66.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.66.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.67.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.67.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.67.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.68.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.68.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.68.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.69.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.69.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.69.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.7.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.7.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.7.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.70.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.70.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.70.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.71.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.71.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.71.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.72.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.72.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.72.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.73.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.73.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.73.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.74.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.74.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.74.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.75.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.75.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.75.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.76.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.76.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.76.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.77.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.77.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.77.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.78.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.78.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.78.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.79.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.79.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.79.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.8.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.8.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.8.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.80.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.80.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.80.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.81.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.81.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.81.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.82.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.82.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.82.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.83.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.83.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.83.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.84.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.84.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.84.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.85.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.85.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.85.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.86.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.86.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.86.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.87.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.87.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.87.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.88.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.88.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.88.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.89.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.89.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.89.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.9.down_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.9.gate_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.9.up_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.mlp.experts.90.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.90.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.90.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.91.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.91.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.91.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.92.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.92.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.92.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.93.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.93.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.93.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.94.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.94.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.94.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.95.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.95.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.95.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.96.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.96.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.96.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.97.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.97.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.97.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.98.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.98.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.98.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.99.down_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.99.gate_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.experts.99.up_proj.weight": "model-00133-of-00142.safetensors", + "model.layers.86.mlp.gate.e_score_correction_bias": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.gate.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.shared_experts.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.shared_experts.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.mlp.shared_experts.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.86.post_attention_layernorm.weight": "model-00134-of-00142.safetensors", + "model.layers.86.self_attn.k_norm.weight": "model-00132-of-00142.safetensors", + "model.layers.86.self_attn.k_proj.bias": "model-00132-of-00142.safetensors", + "model.layers.86.self_attn.k_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.self_attn.o_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.self_attn.q_norm.weight": "model-00132-of-00142.safetensors", + "model.layers.86.self_attn.q_proj.bias": "model-00132-of-00142.safetensors", + "model.layers.86.self_attn.q_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.86.self_attn.v_proj.bias": "model-00132-of-00142.safetensors", + "model.layers.86.self_attn.v_proj.weight": "model-00132-of-00142.safetensors", + "model.layers.87.input_layernorm.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.0.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.0.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.0.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.1.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.1.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.1.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.10.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.10.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.10.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.100.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.100.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.100.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.101.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.101.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.101.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.102.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.102.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.102.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.103.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.103.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.103.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.104.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.104.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.104.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.105.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.105.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.105.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.106.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.106.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.106.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.107.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.107.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.107.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.108.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.108.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.108.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.109.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.109.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.109.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.11.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.11.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.11.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.110.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.110.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.110.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.111.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.111.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.111.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.112.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.112.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.112.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.113.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.113.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.113.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.114.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.114.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.114.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.115.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.115.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.115.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.116.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.116.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.116.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.117.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.117.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.117.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.118.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.118.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.118.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.119.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.119.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.119.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.12.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.12.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.12.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.120.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.120.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.120.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.121.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.121.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.121.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.122.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.122.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.122.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.123.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.123.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.123.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.124.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.124.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.124.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.125.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.125.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.125.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.126.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.126.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.126.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.127.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.127.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.127.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.128.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.128.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.128.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.129.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.129.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.129.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.13.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.13.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.13.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.130.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.130.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.130.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.131.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.131.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.131.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.132.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.132.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.132.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.133.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.133.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.133.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.134.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.134.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.134.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.135.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.135.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.135.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.136.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.136.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.136.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.137.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.137.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.137.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.138.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.138.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.138.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.139.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.139.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.139.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.14.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.14.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.14.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.140.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.140.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.140.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.141.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.141.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.141.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.142.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.142.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.142.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.143.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.143.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.143.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.144.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.144.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.144.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.145.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.145.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.145.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.146.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.146.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.146.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.147.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.147.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.147.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.148.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.148.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.148.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.149.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.149.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.149.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.15.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.15.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.15.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.150.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.150.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.150.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.151.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.151.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.151.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.152.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.152.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.152.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.153.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.153.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.153.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.154.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.154.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.154.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.155.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.155.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.155.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.156.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.156.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.156.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.157.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.157.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.157.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.158.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.158.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.158.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.159.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.159.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.159.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.16.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.16.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.16.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.17.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.17.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.17.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.18.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.18.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.18.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.19.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.19.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.19.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.2.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.2.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.2.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.20.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.20.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.20.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.21.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.21.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.21.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.22.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.22.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.22.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.23.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.23.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.23.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.24.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.24.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.24.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.25.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.25.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.25.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.26.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.26.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.26.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.27.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.27.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.27.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.28.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.28.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.28.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.29.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.29.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.29.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.3.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.3.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.3.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.30.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.30.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.30.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.31.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.31.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.31.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.32.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.32.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.32.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.33.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.33.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.33.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.34.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.34.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.34.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.35.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.35.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.35.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.36.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.36.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.36.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.37.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.37.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.37.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.38.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.38.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.38.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.39.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.39.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.39.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.4.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.4.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.4.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.40.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.40.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.40.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.41.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.41.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.41.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.42.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.42.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.42.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.43.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.43.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.43.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.44.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.44.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.44.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.45.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.45.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.45.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.46.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.46.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.46.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.47.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.47.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.47.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.48.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.48.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.48.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.49.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.49.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.49.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.5.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.5.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.5.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.50.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.50.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.50.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.51.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.51.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.51.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.52.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.52.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.52.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.53.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.53.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.53.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.54.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.54.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.54.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.55.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.55.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.55.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.56.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.56.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.56.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.57.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.57.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.57.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.58.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.58.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.58.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.59.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.59.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.59.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.6.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.6.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.6.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.60.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.60.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.60.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.61.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.61.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.61.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.62.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.62.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.62.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.63.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.63.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.63.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.64.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.64.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.64.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.65.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.65.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.65.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.66.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.66.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.66.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.67.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.67.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.67.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.68.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.68.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.68.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.69.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.69.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.69.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.7.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.7.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.7.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.70.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.70.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.70.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.71.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.71.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.71.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.72.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.72.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.72.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.73.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.73.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.73.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.74.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.74.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.74.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.75.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.75.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.75.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.76.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.76.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.76.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.77.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.77.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.77.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.78.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.78.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.78.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.79.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.79.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.79.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.8.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.8.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.8.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.80.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.80.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.80.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.81.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.81.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.81.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.82.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.82.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.82.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.83.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.83.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.83.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.84.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.84.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.84.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.85.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.85.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.85.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.86.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.86.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.86.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.87.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.87.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.87.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.88.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.88.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.88.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.89.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.89.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.89.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.9.down_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.9.gate_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.9.up_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.mlp.experts.90.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.90.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.90.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.91.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.91.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.91.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.92.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.92.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.92.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.93.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.93.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.93.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.94.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.94.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.94.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.95.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.95.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.95.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.96.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.96.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.96.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.97.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.97.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.97.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.98.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.98.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.98.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.99.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.99.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.experts.99.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.gate.e_score_correction_bias": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.gate.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.shared_experts.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.shared_experts.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.mlp.shared_experts.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.87.post_attention_layernorm.weight": "model-00135-of-00142.safetensors", + "model.layers.87.self_attn.k_norm.weight": "model-00134-of-00142.safetensors", + "model.layers.87.self_attn.k_proj.bias": "model-00134-of-00142.safetensors", + "model.layers.87.self_attn.k_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.self_attn.o_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.self_attn.q_norm.weight": "model-00134-of-00142.safetensors", + "model.layers.87.self_attn.q_proj.bias": "model-00134-of-00142.safetensors", + "model.layers.87.self_attn.q_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.87.self_attn.v_proj.bias": "model-00134-of-00142.safetensors", + "model.layers.87.self_attn.v_proj.weight": "model-00134-of-00142.safetensors", + "model.layers.88.input_layernorm.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.0.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.0.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.0.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.1.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.1.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.1.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.10.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.10.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.10.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.100.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.100.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.100.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.101.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.101.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.101.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.102.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.102.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.102.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.103.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.103.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.103.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.104.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.104.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.104.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.105.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.105.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.105.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.106.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.106.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.106.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.107.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.107.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.107.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.108.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.108.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.108.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.109.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.109.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.109.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.11.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.11.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.11.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.110.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.110.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.110.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.111.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.111.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.111.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.112.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.112.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.112.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.113.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.113.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.113.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.114.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.114.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.114.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.115.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.115.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.115.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.116.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.116.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.116.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.117.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.117.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.117.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.118.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.118.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.118.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.119.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.119.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.119.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.12.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.12.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.12.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.120.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.120.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.120.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.121.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.121.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.121.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.122.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.122.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.122.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.123.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.123.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.123.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.124.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.124.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.124.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.125.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.125.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.125.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.126.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.126.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.126.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.127.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.127.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.127.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.128.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.128.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.128.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.129.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.129.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.129.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.13.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.13.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.13.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.130.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.130.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.130.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.131.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.131.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.131.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.132.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.132.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.132.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.133.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.133.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.133.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.134.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.134.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.134.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.135.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.135.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.135.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.136.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.136.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.136.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.137.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.137.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.137.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.138.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.138.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.138.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.139.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.139.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.139.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.14.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.14.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.14.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.140.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.140.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.140.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.141.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.141.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.141.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.142.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.142.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.142.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.143.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.143.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.143.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.144.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.144.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.144.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.145.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.145.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.145.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.146.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.146.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.146.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.147.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.147.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.147.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.148.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.148.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.148.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.149.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.149.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.149.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.15.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.15.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.15.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.150.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.150.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.150.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.151.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.151.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.151.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.152.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.152.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.152.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.153.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.153.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.153.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.154.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.154.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.154.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.155.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.155.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.155.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.156.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.156.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.156.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.157.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.157.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.157.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.158.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.158.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.158.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.159.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.159.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.159.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.experts.16.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.16.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.16.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.17.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.17.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.17.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.18.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.18.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.18.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.19.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.19.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.19.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.2.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.2.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.2.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.20.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.20.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.20.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.21.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.21.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.21.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.22.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.22.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.22.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.23.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.23.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.23.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.24.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.24.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.24.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.25.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.25.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.25.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.26.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.26.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.26.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.27.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.27.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.27.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.28.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.28.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.28.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.29.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.29.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.29.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.3.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.3.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.3.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.30.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.30.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.30.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.31.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.31.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.31.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.32.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.32.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.32.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.33.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.33.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.33.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.34.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.34.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.34.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.35.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.35.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.35.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.36.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.36.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.36.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.37.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.37.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.37.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.38.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.38.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.38.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.39.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.39.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.39.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.4.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.4.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.4.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.40.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.40.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.40.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.41.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.41.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.41.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.42.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.42.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.42.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.43.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.43.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.43.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.44.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.44.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.44.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.45.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.45.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.45.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.46.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.46.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.46.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.47.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.47.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.47.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.48.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.48.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.48.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.49.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.49.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.49.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.5.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.5.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.5.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.50.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.50.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.50.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.51.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.51.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.51.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.52.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.52.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.52.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.53.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.53.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.53.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.54.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.54.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.54.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.55.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.55.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.55.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.56.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.56.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.56.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.57.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.57.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.57.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.58.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.58.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.58.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.59.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.59.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.59.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.6.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.6.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.6.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.60.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.60.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.60.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.61.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.61.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.61.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.62.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.62.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.62.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.63.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.63.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.63.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.64.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.64.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.64.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.65.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.65.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.65.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.66.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.66.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.66.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.67.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.67.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.67.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.68.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.68.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.68.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.69.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.69.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.69.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.7.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.7.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.7.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.70.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.70.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.70.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.71.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.71.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.71.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.72.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.72.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.72.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.73.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.73.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.73.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.74.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.74.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.74.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.75.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.75.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.75.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.76.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.76.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.76.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.77.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.77.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.77.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.78.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.78.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.78.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.79.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.79.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.79.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.8.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.8.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.8.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.80.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.80.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.80.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.81.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.81.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.81.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.82.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.82.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.82.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.83.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.83.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.83.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.84.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.84.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.84.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.85.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.85.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.85.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.86.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.86.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.86.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.87.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.87.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.87.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.88.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.88.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.88.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.89.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.89.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.89.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.9.down_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.9.gate_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.9.up_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.mlp.experts.90.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.90.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.90.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.91.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.91.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.91.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.92.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.92.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.92.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.93.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.93.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.93.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.94.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.94.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.94.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.95.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.95.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.95.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.96.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.96.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.96.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.97.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.97.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.97.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.98.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.98.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.98.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.99.down_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.99.gate_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.experts.99.up_proj.weight": "model-00136-of-00142.safetensors", + "model.layers.88.mlp.gate.e_score_correction_bias": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.gate.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.shared_experts.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.shared_experts.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.mlp.shared_experts.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.88.post_attention_layernorm.weight": "model-00137-of-00142.safetensors", + "model.layers.88.self_attn.k_norm.weight": "model-00135-of-00142.safetensors", + "model.layers.88.self_attn.k_proj.bias": "model-00135-of-00142.safetensors", + "model.layers.88.self_attn.k_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.self_attn.o_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.self_attn.q_norm.weight": "model-00135-of-00142.safetensors", + "model.layers.88.self_attn.q_proj.bias": "model-00135-of-00142.safetensors", + "model.layers.88.self_attn.q_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.88.self_attn.v_proj.bias": "model-00135-of-00142.safetensors", + "model.layers.88.self_attn.v_proj.weight": "model-00135-of-00142.safetensors", + "model.layers.89.input_layernorm.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.0.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.0.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.0.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.1.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.1.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.1.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.10.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.10.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.10.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.100.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.100.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.100.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.101.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.101.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.101.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.102.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.102.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.102.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.103.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.103.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.103.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.104.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.104.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.104.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.105.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.105.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.105.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.106.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.106.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.106.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.107.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.107.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.107.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.108.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.108.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.108.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.109.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.109.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.109.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.11.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.11.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.11.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.110.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.110.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.110.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.111.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.111.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.111.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.112.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.112.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.112.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.113.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.113.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.113.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.114.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.114.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.114.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.115.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.115.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.115.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.116.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.116.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.116.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.117.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.117.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.117.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.118.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.118.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.118.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.119.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.119.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.119.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.12.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.12.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.12.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.120.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.120.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.120.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.121.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.121.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.121.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.122.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.122.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.122.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.123.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.123.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.123.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.124.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.124.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.124.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.125.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.125.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.125.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.126.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.126.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.126.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.127.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.127.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.127.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.128.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.128.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.128.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.129.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.129.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.129.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.13.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.13.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.13.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.130.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.130.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.130.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.131.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.131.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.131.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.132.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.132.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.132.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.133.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.133.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.133.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.134.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.134.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.134.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.135.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.135.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.135.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.136.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.136.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.136.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.137.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.137.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.137.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.138.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.138.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.138.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.139.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.139.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.139.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.14.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.14.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.14.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.140.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.140.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.140.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.141.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.141.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.141.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.142.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.142.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.142.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.143.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.143.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.143.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.144.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.144.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.144.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.145.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.145.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.145.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.146.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.146.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.146.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.147.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.147.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.147.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.148.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.148.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.148.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.149.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.149.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.149.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.15.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.15.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.15.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.150.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.150.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.150.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.151.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.151.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.151.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.152.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.152.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.152.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.153.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.153.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.153.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.154.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.154.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.154.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.155.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.155.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.155.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.156.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.156.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.156.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.157.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.157.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.157.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.158.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.158.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.158.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.159.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.159.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.159.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.16.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.16.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.16.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.17.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.17.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.17.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.18.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.18.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.18.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.19.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.19.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.19.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.2.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.2.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.2.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.20.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.20.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.20.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.21.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.21.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.21.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.22.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.22.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.22.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.23.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.23.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.23.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.24.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.24.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.24.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.25.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.25.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.25.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.26.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.26.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.26.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.27.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.27.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.27.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.28.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.28.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.28.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.29.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.29.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.29.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.3.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.3.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.3.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.30.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.30.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.30.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.31.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.31.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.31.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.32.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.32.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.32.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.33.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.33.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.33.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.34.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.34.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.34.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.35.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.35.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.35.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.36.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.36.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.36.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.37.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.37.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.37.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.38.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.38.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.38.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.39.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.39.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.39.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.4.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.4.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.4.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.40.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.40.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.40.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.41.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.41.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.41.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.42.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.42.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.42.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.43.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.43.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.43.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.44.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.44.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.44.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.45.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.45.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.45.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.46.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.46.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.46.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.47.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.47.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.47.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.48.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.48.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.48.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.49.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.49.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.49.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.5.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.5.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.5.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.50.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.50.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.50.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.51.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.51.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.51.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.52.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.52.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.52.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.53.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.53.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.53.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.54.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.54.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.54.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.55.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.55.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.55.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.56.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.56.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.56.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.57.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.57.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.57.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.58.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.58.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.58.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.59.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.59.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.59.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.6.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.6.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.6.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.60.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.60.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.60.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.61.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.61.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.61.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.62.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.62.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.62.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.63.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.63.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.63.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.64.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.64.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.64.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.65.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.65.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.65.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.66.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.66.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.66.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.67.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.67.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.67.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.68.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.68.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.68.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.69.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.69.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.69.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.7.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.7.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.7.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.70.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.70.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.70.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.71.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.71.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.71.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.72.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.72.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.72.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.73.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.73.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.73.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.74.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.74.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.74.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.75.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.75.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.75.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.76.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.76.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.76.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.77.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.77.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.77.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.78.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.78.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.78.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.79.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.79.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.79.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.8.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.8.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.8.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.80.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.80.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.80.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.81.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.81.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.81.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.82.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.82.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.82.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.83.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.83.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.83.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.84.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.84.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.84.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.85.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.85.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.85.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.86.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.86.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.86.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.87.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.87.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.87.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.88.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.88.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.88.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.89.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.89.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.89.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.9.down_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.9.gate_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.9.up_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.mlp.experts.90.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.90.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.90.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.91.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.91.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.91.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.92.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.92.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.92.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.93.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.93.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.93.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.94.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.94.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.94.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.95.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.95.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.95.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.96.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.96.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.96.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.97.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.97.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.97.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.98.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.98.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.98.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.99.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.99.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.experts.99.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.gate.e_score_correction_bias": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.gate.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.shared_experts.down_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.shared_experts.gate_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.mlp.shared_experts.up_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.89.post_attention_layernorm.weight": "model-00138-of-00142.safetensors", + "model.layers.89.self_attn.k_norm.weight": "model-00137-of-00142.safetensors", + "model.layers.89.self_attn.k_proj.bias": "model-00137-of-00142.safetensors", + "model.layers.89.self_attn.k_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.self_attn.o_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.self_attn.q_norm.weight": "model-00137-of-00142.safetensors", + "model.layers.89.self_attn.q_proj.bias": "model-00137-of-00142.safetensors", + "model.layers.89.self_attn.q_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.89.self_attn.v_proj.bias": "model-00137-of-00142.safetensors", + "model.layers.89.self_attn.v_proj.weight": "model-00137-of-00142.safetensors", + "model.layers.9.input_layernorm.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.0.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.0.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.0.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.1.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.1.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.1.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.10.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.10.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.10.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.100.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.100.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.100.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.101.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.101.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.101.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.102.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.102.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.102.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.103.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.103.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.103.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.104.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.104.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.104.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.105.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.105.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.105.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.106.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.106.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.106.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.107.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.107.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.107.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.108.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.108.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.108.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.109.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.109.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.109.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.11.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.11.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.11.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.110.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.110.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.110.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.111.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.111.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.111.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.112.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.112.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.112.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.113.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.113.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.113.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.114.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.114.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.114.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.115.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.115.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.115.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.116.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.116.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.116.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.117.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.117.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.117.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.118.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.118.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.118.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.119.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.119.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.119.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.12.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.12.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.12.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.120.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.120.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.120.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.121.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.121.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.121.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.122.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.122.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.122.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.123.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.123.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.123.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.124.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.124.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.124.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.125.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.125.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.125.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.126.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.126.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.126.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.127.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.127.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.127.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.128.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.128.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.128.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.129.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.129.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.129.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.13.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.13.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.13.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.130.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.130.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.130.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.131.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.131.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.131.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.132.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.132.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.132.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.133.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.133.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.133.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.134.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.134.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.134.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.135.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.135.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.135.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.136.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.136.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.136.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.137.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.137.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.137.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.138.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.138.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.138.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.139.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.139.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.139.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.14.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.14.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.14.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.140.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.140.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.140.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.141.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.141.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.141.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.142.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.142.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.142.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.143.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.143.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.143.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.144.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.144.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.144.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.145.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.145.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.145.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.146.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.146.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.146.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.147.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.147.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.147.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.148.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.148.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.148.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.149.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.149.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.149.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.15.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.15.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.15.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.150.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.150.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.150.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.151.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.151.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.151.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.152.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.152.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.152.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.153.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.153.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.153.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.154.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.154.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.154.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.155.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.155.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.155.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.156.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.156.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.156.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.157.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.157.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.157.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.158.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.158.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.158.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.159.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.159.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.159.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.16.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.16.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.16.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.17.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.17.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.17.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.18.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.18.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.18.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.19.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.19.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.19.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.2.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.2.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.2.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.20.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.20.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.20.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.21.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.21.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.21.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.22.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.22.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.22.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.23.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.23.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.23.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.24.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.24.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.24.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.25.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.25.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.25.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.26.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.26.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.26.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.27.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.27.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.27.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.28.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.28.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.28.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.29.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.29.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.29.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.3.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.3.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.3.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.30.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.30.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.30.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.31.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.31.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.31.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.32.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.32.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.32.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.33.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.33.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.33.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.34.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.34.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.34.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.35.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.35.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.35.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.36.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.36.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.36.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.37.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.37.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.37.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.38.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.38.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.38.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.39.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.39.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.39.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.4.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.4.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.4.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.40.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.40.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.40.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.41.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.41.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.41.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.42.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.42.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.42.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.43.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.43.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.43.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.44.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.44.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.44.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.45.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.45.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.45.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.46.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.46.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.46.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.47.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.47.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.47.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.48.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.48.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.48.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.49.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.49.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.49.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.5.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.5.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.5.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.50.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.50.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.50.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.51.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.51.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.51.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.52.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.52.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.52.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.53.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.53.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.53.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.54.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.54.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.54.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.55.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.55.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.55.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.56.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.56.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.56.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.57.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.57.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.57.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.58.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.58.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.58.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.59.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.59.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.59.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.6.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.6.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.6.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.60.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.60.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.60.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.61.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.61.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.61.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.62.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.62.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.62.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.63.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.63.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.63.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.64.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.64.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.64.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.65.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.65.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.65.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.66.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.66.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.66.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.67.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.67.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.67.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.68.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.68.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.68.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.69.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.69.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.69.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.7.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.7.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.70.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.70.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.70.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.71.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.71.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.71.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.72.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.72.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.72.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.73.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.73.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.73.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.74.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.74.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.74.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.75.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.75.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.75.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.76.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.76.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.76.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.77.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.77.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.77.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.78.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.78.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.78.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.79.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.79.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.79.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.8.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.8.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.8.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.80.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.80.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.80.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.81.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.81.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.81.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.82.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.82.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.82.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.83.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.83.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.83.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.84.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.84.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.84.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.85.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.85.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.85.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.86.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.86.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.86.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.87.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.87.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.87.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.88.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.88.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.88.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.89.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.89.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.89.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.9.down_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.9.gate_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.9.up_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.mlp.experts.90.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.90.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.90.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.91.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.91.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.91.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.92.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.92.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.92.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.93.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.93.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.93.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.94.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.94.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.94.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.95.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.95.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.95.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.96.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.96.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.96.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.97.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.97.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.97.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.98.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.98.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.98.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.99.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.99.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.experts.99.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.gate.e_score_correction_bias": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.gate.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.shared_experts.down_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.shared_experts.gate_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.mlp.shared_experts.up_proj.weight": "model-00012-of-00142.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00012-of-00142.safetensors", + "model.layers.9.self_attn.k_norm.weight": "model-00011-of-00142.safetensors", + "model.layers.9.self_attn.k_proj.bias": "model-00011-of-00142.safetensors", + "model.layers.9.self_attn.k_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.self_attn.q_norm.weight": "model-00011-of-00142.safetensors", + "model.layers.9.self_attn.q_proj.bias": "model-00011-of-00142.safetensors", + "model.layers.9.self_attn.q_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.9.self_attn.v_proj.bias": "model-00011-of-00142.safetensors", + "model.layers.9.self_attn.v_proj.weight": "model-00011-of-00142.safetensors", + "model.layers.90.input_layernorm.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.0.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.0.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.0.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.1.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.1.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.1.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.10.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.10.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.10.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.100.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.100.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.100.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.101.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.101.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.101.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.102.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.102.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.102.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.103.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.103.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.103.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.104.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.104.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.104.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.105.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.105.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.105.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.106.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.106.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.106.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.107.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.107.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.107.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.108.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.108.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.108.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.109.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.109.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.109.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.11.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.11.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.11.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.110.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.110.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.110.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.111.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.111.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.111.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.112.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.112.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.112.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.113.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.113.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.113.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.114.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.114.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.114.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.115.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.115.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.115.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.116.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.116.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.116.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.117.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.117.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.117.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.118.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.118.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.118.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.119.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.119.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.119.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.12.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.12.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.12.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.120.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.120.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.120.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.121.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.121.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.121.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.122.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.122.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.122.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.123.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.123.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.123.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.124.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.124.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.124.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.125.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.125.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.125.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.126.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.126.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.126.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.127.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.127.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.127.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.128.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.128.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.128.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.129.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.129.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.129.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.13.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.13.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.13.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.130.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.130.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.130.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.131.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.131.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.131.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.132.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.132.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.132.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.133.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.133.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.133.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.134.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.134.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.134.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.135.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.135.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.135.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.136.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.136.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.136.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.137.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.137.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.137.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.138.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.138.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.138.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.139.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.139.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.139.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.14.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.14.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.14.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.140.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.140.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.140.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.141.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.141.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.141.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.142.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.142.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.142.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.143.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.143.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.143.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.144.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.144.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.144.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.145.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.145.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.145.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.146.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.146.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.146.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.147.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.147.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.147.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.148.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.148.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.148.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.149.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.149.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.149.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.15.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.15.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.15.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.150.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.150.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.150.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.151.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.151.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.151.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.152.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.152.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.152.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.153.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.153.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.153.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.154.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.154.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.154.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.155.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.155.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.155.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.156.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.156.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.156.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.157.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.157.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.157.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.158.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.158.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.158.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.159.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.159.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.159.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.experts.16.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.16.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.16.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.17.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.17.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.17.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.18.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.18.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.18.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.19.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.19.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.19.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.2.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.2.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.2.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.20.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.20.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.20.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.21.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.21.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.21.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.22.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.22.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.22.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.23.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.23.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.23.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.24.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.24.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.24.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.25.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.25.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.25.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.26.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.26.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.26.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.27.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.27.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.27.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.28.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.28.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.28.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.29.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.29.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.29.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.3.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.3.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.3.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.30.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.30.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.30.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.31.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.31.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.31.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.32.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.32.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.32.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.33.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.33.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.33.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.34.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.34.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.34.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.35.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.35.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.35.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.36.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.36.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.36.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.37.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.37.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.37.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.38.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.38.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.38.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.39.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.39.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.39.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.4.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.4.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.4.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.40.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.40.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.40.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.41.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.41.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.41.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.42.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.42.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.42.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.43.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.43.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.43.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.44.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.44.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.44.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.45.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.45.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.45.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.46.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.46.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.46.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.47.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.47.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.47.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.48.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.48.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.48.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.49.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.49.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.49.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.5.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.5.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.5.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.50.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.50.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.50.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.51.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.51.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.51.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.52.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.52.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.52.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.53.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.53.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.53.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.54.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.54.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.54.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.55.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.55.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.55.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.56.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.56.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.56.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.57.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.57.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.57.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.58.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.58.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.58.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.59.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.59.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.59.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.6.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.6.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.6.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.60.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.60.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.60.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.61.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.61.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.61.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.62.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.62.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.62.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.63.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.63.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.63.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.64.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.64.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.64.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.65.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.65.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.65.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.66.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.66.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.66.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.67.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.67.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.67.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.68.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.68.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.68.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.69.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.69.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.69.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.7.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.7.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.7.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.70.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.70.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.70.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.71.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.71.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.71.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.72.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.72.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.72.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.73.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.73.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.73.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.74.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.74.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.74.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.75.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.75.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.75.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.76.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.76.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.76.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.77.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.77.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.77.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.78.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.78.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.78.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.79.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.79.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.79.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.8.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.8.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.8.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.80.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.80.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.80.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.81.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.81.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.81.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.82.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.82.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.82.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.83.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.83.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.83.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.84.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.84.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.84.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.85.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.85.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.85.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.86.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.86.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.86.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.87.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.87.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.87.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.88.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.88.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.88.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.89.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.89.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.89.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.9.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.9.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.9.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.90.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.90.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.90.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.91.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.91.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.91.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.92.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.92.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.92.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.93.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.93.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.93.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.94.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.94.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.94.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.95.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.95.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.95.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.96.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.96.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.96.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.97.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.97.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.97.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.98.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.98.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.98.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.99.down_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.99.gate_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.experts.99.up_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.mlp.gate.e_score_correction_bias": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.gate.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.shared_experts.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.shared_experts.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.mlp.shared_experts.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.90.post_attention_layernorm.weight": "model-00140-of-00142.safetensors", + "model.layers.90.self_attn.k_norm.weight": "model-00139-of-00142.safetensors", + "model.layers.90.self_attn.k_proj.bias": "model-00138-of-00142.safetensors", + "model.layers.90.self_attn.k_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.90.self_attn.o_proj.weight": "model-00139-of-00142.safetensors", + "model.layers.90.self_attn.q_norm.weight": "model-00139-of-00142.safetensors", + "model.layers.90.self_attn.q_proj.bias": "model-00138-of-00142.safetensors", + "model.layers.90.self_attn.q_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.90.self_attn.v_proj.bias": "model-00138-of-00142.safetensors", + "model.layers.90.self_attn.v_proj.weight": "model-00138-of-00142.safetensors", + "model.layers.91.input_layernorm.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.0.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.0.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.0.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.1.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.1.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.1.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.10.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.10.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.10.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.100.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.100.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.100.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.101.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.101.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.101.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.102.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.102.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.102.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.103.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.103.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.103.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.104.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.104.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.104.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.105.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.105.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.105.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.106.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.106.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.106.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.107.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.107.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.107.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.108.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.108.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.108.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.109.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.109.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.109.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.11.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.11.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.11.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.110.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.110.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.110.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.111.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.111.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.111.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.112.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.112.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.112.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.113.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.113.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.113.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.114.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.114.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.114.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.115.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.115.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.115.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.116.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.116.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.116.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.117.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.117.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.117.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.118.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.118.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.118.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.119.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.119.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.119.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.12.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.12.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.12.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.120.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.120.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.120.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.121.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.121.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.121.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.122.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.122.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.122.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.123.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.123.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.123.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.124.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.124.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.124.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.125.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.125.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.125.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.126.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.126.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.126.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.127.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.127.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.127.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.128.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.128.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.128.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.129.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.129.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.129.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.13.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.13.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.13.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.130.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.130.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.130.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.131.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.131.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.131.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.132.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.132.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.132.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.133.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.133.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.133.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.134.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.134.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.134.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.135.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.135.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.135.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.136.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.136.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.136.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.137.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.137.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.137.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.138.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.138.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.138.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.139.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.139.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.139.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.14.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.14.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.14.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.140.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.140.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.140.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.141.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.141.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.141.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.142.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.142.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.142.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.143.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.143.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.143.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.144.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.144.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.144.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.145.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.145.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.145.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.146.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.146.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.146.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.147.down_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.147.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.147.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.148.down_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.148.gate_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.148.up_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.149.down_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.149.gate_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.149.up_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.15.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.15.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.15.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.150.down_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.150.gate_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.150.up_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.151.down_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.151.gate_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.151.up_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.152.down_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.152.gate_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.152.up_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.153.down_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.153.gate_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.153.up_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.154.down_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.154.gate_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.154.up_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.155.down_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.155.gate_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.155.up_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.156.down_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.156.gate_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.156.up_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.157.down_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.157.gate_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.157.up_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.158.down_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.158.gate_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.158.up_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.159.down_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.159.gate_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.159.up_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.experts.16.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.16.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.16.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.17.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.17.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.17.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.18.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.18.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.18.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.19.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.19.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.19.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.2.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.2.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.2.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.20.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.20.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.20.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.21.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.21.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.21.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.22.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.22.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.22.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.23.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.23.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.23.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.24.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.24.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.24.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.25.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.25.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.25.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.26.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.26.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.26.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.27.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.27.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.27.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.28.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.28.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.28.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.29.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.29.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.29.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.3.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.3.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.3.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.30.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.30.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.30.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.31.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.31.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.31.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.32.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.32.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.32.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.33.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.33.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.33.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.34.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.34.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.34.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.35.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.35.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.35.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.36.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.36.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.36.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.37.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.37.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.37.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.38.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.38.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.38.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.39.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.39.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.39.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.4.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.4.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.4.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.40.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.40.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.40.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.41.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.41.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.41.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.42.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.42.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.42.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.43.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.43.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.43.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.44.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.44.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.44.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.45.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.45.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.45.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.46.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.46.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.46.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.47.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.47.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.47.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.48.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.48.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.48.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.49.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.49.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.49.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.5.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.5.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.5.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.50.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.50.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.50.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.51.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.51.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.51.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.52.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.52.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.52.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.53.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.53.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.53.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.54.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.54.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.54.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.55.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.55.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.55.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.56.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.56.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.56.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.57.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.57.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.57.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.58.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.58.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.58.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.59.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.59.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.59.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.6.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.6.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.6.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.60.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.60.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.60.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.61.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.61.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.61.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.62.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.62.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.62.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.63.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.63.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.63.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.64.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.64.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.64.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.65.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.65.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.65.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.66.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.66.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.66.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.67.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.67.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.67.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.68.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.68.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.68.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.69.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.69.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.69.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.7.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.7.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.7.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.70.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.70.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.70.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.71.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.71.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.71.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.72.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.72.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.72.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.73.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.73.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.73.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.74.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.74.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.74.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.75.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.75.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.75.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.76.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.76.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.76.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.77.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.77.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.77.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.78.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.78.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.78.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.79.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.79.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.79.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.8.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.8.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.8.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.80.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.80.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.80.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.81.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.81.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.81.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.82.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.82.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.82.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.83.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.83.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.83.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.84.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.84.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.84.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.85.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.85.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.85.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.86.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.86.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.86.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.87.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.87.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.87.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.88.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.88.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.88.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.89.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.89.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.89.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.9.down_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.9.gate_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.9.up_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.mlp.experts.90.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.90.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.90.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.91.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.91.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.91.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.92.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.92.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.92.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.93.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.93.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.93.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.94.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.94.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.94.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.95.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.95.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.95.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.96.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.96.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.96.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.97.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.97.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.97.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.98.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.98.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.98.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.99.down_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.99.gate_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.experts.99.up_proj.weight": "model-00141-of-00142.safetensors", + "model.layers.91.mlp.gate.e_score_correction_bias": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.gate.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.shared_experts.down_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.shared_experts.gate_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.mlp.shared_experts.up_proj.weight": "model-00142-of-00142.safetensors", + "model.layers.91.post_attention_layernorm.weight": "model-00142-of-00142.safetensors", + "model.layers.91.self_attn.k_norm.weight": "model-00140-of-00142.safetensors", + "model.layers.91.self_attn.k_proj.bias": "model-00140-of-00142.safetensors", + "model.layers.91.self_attn.k_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.self_attn.o_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.self_attn.q_norm.weight": "model-00140-of-00142.safetensors", + "model.layers.91.self_attn.q_proj.bias": "model-00140-of-00142.safetensors", + "model.layers.91.self_attn.q_proj.weight": "model-00140-of-00142.safetensors", + "model.layers.91.self_attn.v_proj.bias": "model-00140-of-00142.safetensors", + "model.layers.91.self_attn.v_proj.weight": "model-00140-of-00142.safetensors", + "model.norm.weight": "model-00142-of-00142.safetensors" + } +} diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..9028cf84013844f17d7616bdec1d88e977924434 --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,40 @@ +{ + "additional_special_tokens": [ + "<|endoftext|>", + "[MASK]", + "[gMASK]", + "[sMASK]", + "", + "", + "<|system|>", + "<|user|>", + "<|assistant|>", + "<|observation|>", + "<|begin_of_image|>", + "<|end_of_image|>", + "<|begin_of_video|>", + "<|end_of_video|>", + "<|begin_of_audio|>", + "<|end_of_audio|>", + "<|begin_of_transcription|>", + "<|end_of_transcription|>", + "<|code_prefix|>", + "<|code_middle|>", + "<|code_suffix|>", + "/nothink" + ], + "eos_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..e3ed3c66baf1ec4de61840b0abf02142687bfed8 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bda8e2146c3bb7b7e0fc96dcc4f0aeff041c6c27952e3ace0665663ebff346ba +size 19970700 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..75e11cfb2e0cc09f19391ec2278b4825a4c3fae9 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,325 @@ +{ + "added_tokens_decoder": { + "151329": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151330": { + "content": "[MASK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151331": { + "content": "[gMASK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151332": { + "content": "[sMASK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151333": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151334": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151335": { + "content": "<|system|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151336": { + "content": "<|user|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151337": { + "content": "<|assistant|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151338": { + "content": "<|observation|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151339": { + "content": "<|begin_of_image|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151340": { + "content": "<|end_of_image|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151341": { + "content": "<|begin_of_video|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151342": { + "content": "<|end_of_video|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151343": { + "content": "<|begin_of_audio|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151344": { + "content": "<|end_of_audio|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151345": { + "content": "<|begin_of_transcription|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151346": { + "content": "<|end_of_transcription|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151347": { + "content": "<|code_prefix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151348": { + "content": "<|code_middle|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151349": { + "content": "<|code_suffix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151350": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151351": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151352": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151353": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151354": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151355": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151356": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151357": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151358": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151359": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151360": { + "content": "/nothink", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151361": { + "content": "<|begin_of_box|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151362": { + "content": "<|end_of_box|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151363": { + "content": "<|image|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151364": { + "content": "<|video|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + } + }, + "additional_special_tokens": [ + "<|endoftext|>", + "[MASK]", + "[gMASK]", + "[sMASK]", + "", + "", + "<|system|>", + "<|user|>", + "<|assistant|>", + "<|observation|>", + "<|begin_of_image|>", + "<|end_of_image|>", + "<|begin_of_video|>", + "<|end_of_video|>", + "<|begin_of_audio|>", + "<|end_of_audio|>", + "<|begin_of_transcription|>", + "<|end_of_transcription|>", + "<|code_prefix|>", + "<|code_middle|>", + "<|code_suffix|>", + "/nothink" + ], + "clean_up_tokenization_spaces": false, + "do_lower_case": false, + "eos_token": "<|endoftext|>", + "extra_special_tokens": {}, + "model_max_length": 128000, + "pad_token": "<|endoftext|>", + "padding_side": "left", + "remove_space": false, + "tokenizer_class": "PreTrainedTokenizerFast" +}